From 4978aaff25d210d296352554680ac95107612e50 Mon Sep 17 00:00:00 2001 From: zerob13 Date: Sat, 13 Jun 2026 07:55:59 +0800 Subject: [PATCH 1/8] refactor(ipc): migrate presenter transport --- docs/ARCHITECTURE.md | 10 +- docs/README.md | 6 +- .../baselines/archive-reference-report.md | 2 +- .../baselines/dependency-report.md | 230 +- .../main-kernel-boundary-baseline.md | 61 +- .../main-kernel-migration-scoreboard.json | 26 +- .../main-kernel-migration-scoreboard.md | 22 +- .../baselines/zero-inbound-candidates.md | 141 +- docs/architecture/event-system.md | 204 +- .../presenter-ipc-migration-plan/audit.md | 126 + .../change-map.zh-CN.md | 867 + .../presenter-ipc-migration-plan/plan.md | 643 + .../presenter-ipc-migration-plan/spec.md | 78 + .../presenter-ipc-migration-plan/tasks.md | 970 + .../verification.md | 538 + docs/guides/code-navigation.md | 6 +- docs/guides/getting-started.md | 7 +- resources/acp-registry/registry.json | 62 +- resources/model-db/providers.json | 179276 ++++++++------- scripts/architecture-guard.mjs | 33 +- scripts/generate-architecture-baseline.mjs | 44 +- src/main/appMain.ts | 10 +- src/main/contextMenuHelper.ts | 18 +- src/main/events.ts | 159 +- .../agentRuntimePresenter/dispatch.ts | 28 +- .../presenter/agentRuntimePresenter/echo.ts | 8 - .../presenter/agentRuntimePresenter/index.ts | 46 +- .../pendingInputCoordinator.ts | 5 - .../presenter/agentSessionPresenter/index.ts | 25 - .../presenter/browser/YoBrowserPresenter.ts | 30 - .../configPresenter/acpInitHelper.ts | 40 +- .../configPresenter/eventPublishers.ts | 200 + src/main/presenter/configPresenter/index.ts | 105 +- .../configPresenter/mcpConfHelper.ts | 27 +- .../configPresenter/modelStatusHelper.ts | 7 +- .../configPresenter/providerDbLoader.ts | 20 +- .../configPresenter/providerHelper.ts | 21 +- .../configPresenter/providerModelHelper.ts | 9 +- .../configPresenter/systemPromptHelper.ts | 7 +- .../configPresenter/uiSettingsHelper.ts | 18 +- 
src/main/presenter/deeplinkPresenter/index.ts | 22 +- src/main/presenter/devicePresenter/index.ts | 28 +- src/main/presenter/dialogPresenter/index.ts | 4 - .../FloatingButtonWindow.ts | 8 +- .../floatingButtonPresenter/index.ts | 45 +- src/main/presenter/index.ts | 243 +- .../knowledgeStorePresenter.ts | 45 +- .../lifecyclePresenter/SplashWindowManager.ts | 18 +- .../hooks/ready/eventListenerSetupHook.ts | 9 +- .../presenter/lifecyclePresenter/index.ts | 5 +- .../acp/acpProcessManager.ts | 19 +- .../llmProviderPresenter/baseProvider.ts | 5 +- .../managers/ollamaManager.ts | 3 - .../managers/rateLimitManager.ts | 18 +- .../llmProviderPresenter/oauthHelper.ts | 8 +- .../providers/acpProvider.ts | 44 +- src/main/presenter/mcpPresenter/index.ts | 50 +- src/main/presenter/mcpPresenter/mcpClient.ts | 43 +- .../presenter/mcpPresenter/serverManager.ts | 10 +- .../presenter/mcpPresenter/toolManager.ts | 14 +- src/main/presenter/notificationPresenter.ts | 11 +- .../presenter/presenterCallErrorHandler.ts | 7 +- src/main/presenter/sessionPresenter/events.ts | 12 - src/main/presenter/sessionPresenter/index.ts | 48 +- .../managers/conversationManager.ts | 68 +- .../managers/messageManager.ts | 16 +- .../sessionPresenter/tab/tabManager.ts | 19 +- src/main/presenter/shortcutPresenter.ts | 24 +- src/main/presenter/skillPresenter/index.ts | 20 - .../presenter/skillSyncPresenter/index.ts | 54 +- src/main/presenter/syncPresenter/index.ts | 44 +- src/main/presenter/tabPresenter.ts | 45 +- .../agentTools/agentToolManager.ts | 4 +- .../agentTools/chatSettingsTools.ts | 12 +- .../presenter/toolPresenter/runtimePorts.ts | 4 + src/main/presenter/upgradePresenter/index.ts | 6 +- .../windowPresenter/FloatingChatWindow.ts | 10 +- src/main/presenter/windowPresenter/index.ts | 203 +- .../presenter/workspacePresenter/index.ts | 3 - src/main/routes/config/configRouteHandler.ts | 219 + src/main/routes/config/configRouteSupport.ts | 21 + src/main/routes/index.ts | 539 +- 
src/main/routes/legacyTypedEventBridge.ts | 459 - .../routes/providers/providerRouteHandler.ts | 52 +- src/main/routes/publishDeepchatEvent.ts | 21 +- src/preload/browser-overlay-preload.ts | 10 +- src/preload/floating-preload.ts | 239 +- src/preload/index.d.ts | 4 +- src/preload/index.ts | 4 +- src/preload/splash-preload.ts | 65 +- src/renderer/api/AcpTerminalClient.ts | 67 + src/renderer/api/AppRuntimeClient.ts | 72 + src/renderer/api/BrowserClient.ts | 7 + src/renderer/api/ConfigClient.ts | 226 +- src/renderer/api/ContextMenuClient.ts | 28 + src/renderer/api/DatabaseSecurityClient.ts | 10 +- src/renderer/api/DeviceClient.ts | 17 +- src/renderer/api/KnowledgeClient.ts | 124 + src/renderer/api/McpClient.ts | 39 + src/renderer/api/NowledgeMemClient.ts | 34 + src/renderer/api/OAuthClient.ts | 27 + src/renderer/api/ProjectClient.ts | 7 + src/renderer/api/ProviderClient.ts | 119 +- src/renderer/api/RemoteControlClient.ts | 134 + src/renderer/api/RemoteControlRuntime.ts | 44 - src/renderer/api/SessionClient.ts | 43 + src/renderer/api/ShortcutClient.ts | 32 + src/renderer/api/ShortcutRuntime.ts | 21 - src/renderer/api/SkillClient.ts | 7 + src/renderer/api/SkillSyncClient.ts | 182 + src/renderer/api/WindowClient.ts | 95 +- src/renderer/api/index.ts | 9 + src/renderer/api/legacy/README.md | 27 - src/renderer/api/legacy/presenterTransport.ts | 102 - src/renderer/api/legacy/presenters.ts | 28 - src/renderer/api/legacy/runtime.ts | 125 - src/renderer/api/runtime.ts | 4 + src/renderer/floating/FloatingButton.vue | 6 +- src/renderer/floating/env.d.ts | 15 +- src/renderer/floating/main.ts | 13 +- src/renderer/settings/App.vue | 70 +- .../settings/components/AboutUsSettings.vue | 42 +- .../settings/components/AcpDebugDialog.vue | 50 +- .../components/AcpDependencyDialog.vue | 14 +- .../settings/components/AcpSettings.vue | 45 +- .../settings/components/AcpTerminalDialog.vue | 72 +- .../components/BuiltinKnowledgeSettings.vue | 13 +- .../settings/components/DashboardSettings.vue 
| 8 +- .../settings/components/DataSettings.vue | 41 +- .../components/DeepChatAgentsSettings.vue | 42 +- .../components/EnvironmentsSettings.vue | 6 +- .../components/GitHubCopilotOAuth.vue | 8 +- .../components/KnowledgeBaseSettings.vue | 6 +- .../settings/components/KnowledgeFile.vue | 37 +- .../settings/components/KnowledgeFileItem.vue | 25 +- .../settings/components/McpBuiltinMarket.vue | 18 +- .../settings/components/McpSettings.vue | 12 +- .../components/ModelProviderSettings.vue | 6 +- .../settings/components/ModelScopeMcpSync.vue | 6 +- .../components/NotificationsHooksSettings.vue | 10 +- .../components/NowledgeMemSettings.vue | 25 +- .../settings/components/ProviderApiConfig.vue | 8 +- .../components/ProviderRateLimitConfig.vue | 41 +- .../settings/components/RemoteSettings.vue | 264 +- .../settings/components/SettingsOverview.vue | 3 +- .../settings/components/ShortcutSettings.vue | 11 +- .../common/DefaultModelSettingsSection.vue | 19 +- .../common/LoggingSettingsSection.vue | 6 +- .../common/ProxySettingsSection.vue | 19 +- .../common/UploadFileSettingsSection.vue | 8 +- .../components/prompt/PromptEditorSheet.vue | 37 +- .../components/skills/SkillEditorSheet.vue | 6 +- .../components/skills/SkillInstallDialog.vue | 8 +- .../skills/SkillSyncDialog/ExportWizard.vue | 10 +- .../skills/SkillSyncDialog/ImportWizard.vue | 13 +- .../components/skills/SkillsSettings.vue | 31 +- .../components/skills/SyncPromptDialog.vue | 30 +- .../components/skills/SyncStatusCard.vue | 2 + .../components/skills/SyncStatusSection.vue | 27 +- .../settings/lib/guidedOnboardingSettings.ts | 6 +- src/renderer/settings/main.ts | 3 +- src/renderer/splash/env.d.ts | 29 + src/renderer/splash/loading.vue | 36 +- src/renderer/src/App.vue | 4 +- src/renderer/src/components/ModelSelect.vue | 2 +- src/renderer/src/components/WindowSideBar.vue | 12 +- .../message/SelectedTextContextMenu.vue | 24 +- .../src/composables/useAppIpcRuntime.ts | 96 +- src/renderer/src/env.d.ts | 29 + 
src/renderer/src/events.ts | 173 +- src/renderer/src/lib/ipcSubscription.ts | 1 - src/renderer/src/lib/storeInitializer.ts | 12 +- src/renderer/src/pages/ChatPage.vue | 8 +- src/renderer/src/pages/WelcomePage.vue | 7 + src/renderer/src/stores/shortcutKey.ts | 8 +- src/renderer/src/stores/ui/messageIpc.ts | 20 - src/shared/contracts/domainSchemas.ts | 354 + src/shared/contracts/events.ts | 95 +- .../contracts/events/acp-terminal.events.ts | 62 + .../contracts/events/app-runtime.events.ts | 68 + .../contracts/events/context-menu.events.ts | 18 + .../contracts/events/knowledge.events.ts | 16 + .../contracts/events/notification.events.ts | 22 + .../contracts/events/providers.events.ts | 45 + .../contracts/events/sessions.events.ts | 33 +- .../contracts/events/settings.events.ts | 43 + .../contracts/events/skillSync.events.ts | 77 + src/shared/contracts/routes.ts | 220 +- .../contracts/routes/acp-terminal.routes.ts | 20 + src/shared/contracts/routes/browser.routes.ts | 8 + src/shared/contracts/routes/config.routes.ts | 409 + .../routes/database-security.routes.ts | 51 + src/shared/contracts/routes/device.routes.ts | 31 + .../contracts/routes/knowledge.routes.ts | 129 + src/shared/contracts/routes/mcp.routes.ts | 75 + .../contracts/routes/nowledgeMem.routes.ts | 48 + src/shared/contracts/routes/oauth.routes.ts | 24 + src/shared/contracts/routes/project.routes.ts | 10 + .../contracts/routes/providers.routes.ts | 82 + .../contracts/routes/remote-control.routes.ts | 208 + .../contracts/routes/sessions.routes.ts | 18 +- .../contracts/routes/shortcut.routes.ts | 26 + .../contracts/routes/skillSync.routes.ts | 93 + src/shared/contracts/routes/skills.routes.ts | 10 + src/shared/contracts/routes/window.routes.ts | 72 + src/shared/floatingButtonChannels.ts | 25 + .../types/presenters/legacy.presenters.d.ts | 6 + test/e2e/fixtures/electronApp.ts | 108 +- test/e2e/specs/02-chat-basic.smoke.spec.ts | 5 + .../03-session-persistence.smoke.spec.ts | 5 + 
.../06-settings-ipc-boundary.smoke.spec.ts | 74 + .../07-floating-ipc-boundary.smoke.spec.ts | 139 + test/e2e/specs/08-browser-route.smoke.spec.ts | 73 + .../specs/09-main-ipc-boundary.smoke.spec.ts | 83 + .../10-settings-privacy-route.smoke.spec.ts | 70 + ...emote-control-readonly-route.smoke.spec.ts | 87 + .../12-knowledge-readonly-route.smoke.spec.ts | 50 + .../specs/13-mcp-readonly-route.smoke.spec.ts | 65 + .../14-nowledgemem-config-route.smoke.spec.ts | 100 + .../15-dashboard-readonly-route.smoke.spec.ts | 84 + .../16-skills-readonly-route.smoke.spec.ts | 87 + .../specs/17-acp-readonly-route.smoke.spec.ts | 109 + .../18-provider-readonly-route.smoke.spec.ts | 177 + ...19-skill-sync-readonly-route.smoke.spec.ts | 144 + ...data-security-readonly-route.smoke.spec.ts | 106 + .../21-project-readonly-route.smoke.spec.ts | 105 + .../22-window-readonly-route.smoke.spec.ts | 49 + .../23-config-readonly-route.smoke.spec.ts | 196 + ...config-system-readonly-route.smoke.spec.ts | 99 + ...ow-provider-deeplink-preview.smoke.spec.ts | 63 + .../26-deepchat-agent-crud.smoke.spec.ts | 147 + ...7-hooks-notification-command.smoke.spec.ts | 91 + .../28-shortcut-route-restore.smoke.spec.ts | 146 + .../29-workspace-readonly-route.smoke.spec.ts | 86 + test/main/presenter/SyncPresenter.test.ts | 34 + .../main/presenter/YoBrowserPresenter.test.ts | 22 +- test/main/presenter/acpProvider.test.ts | 124 +- .../agentRuntimePresenter.test.ts | 112 +- .../agentRuntimePresenter/dispatch.test.ts | 63 +- .../agentRuntimePresenter/echo.test.ts | 39 +- .../agentRuntimePresenter/process.test.ts | 74 +- .../agentSessionPresenter.test.ts | 65 +- .../agentSessionPresenter/integration.test.ts | 24 +- .../configPresenter/fontSizeSettings.test.ts | 124 + .../configPresenter/mcpConfHelper.test.ts | 52 + .../configPresenter/modelStatusHelper.test.ts | 10 +- .../configPresenter/providerDbLoader.test.ts | 35 +- .../configPresenter/providerHelper.test.ts | 10 +- .../providerModelHelper.test.ts | 8 + 
test/main/presenter/deeplinkPresenter.test.ts | 55 +- test/main/presenter/devicePresenter.test.ts | 29 +- test/main/presenter/dialogPresenter.test.ts | 65 + .../knowledgeStorePresenter.test.ts | 125 + .../SplashWindowManager.display.test.ts | 7 + .../acp/acpProcessManager.test.ts | 43 + .../awsBedrockProvider.test.ts | 67 +- .../ollamaManager.test.ts | 49 + .../rateLimitManager.test.ts | 40 +- test/main/presenter/mcpClient.test.ts | 5 + test/main/presenter/mcpPresenter.test.ts | 87 + .../mcpPresenter/serverManager.test.ts | 1 + .../mcpPresenter/toolManager.test.ts | 3 +- .../presenter/notificationPresenter.test.ts | 90 + test/main/presenter/pluginPresenter.test.ts | 32 +- .../presenterCallErrorHandler.test.ts | 11 +- .../skillPresenter/skillPresenter.test.ts | 145 +- .../skillSyncPresenter/index.test.ts | 130 +- .../agentTools/chatSettingsTools.test.ts | 7 +- test/main/presenter/upgradePresenter.test.ts | 14 +- .../main/presenter/workspacePresenter.test.ts | 27 +- test/main/routes/contracts.test.ts | 938 +- test/main/routes/dispatcher.test.ts | 2122 +- test/main/scripts/architectureGuard.test.ts | 55 + test/renderer/api/clients.test.ts | 1486 +- test/renderer/api/preloadBoundaries.test.ts | 326 + .../assets/markstreamTailwindSource.test.ts | 17 +- .../components/AboutUsSettings.test.ts | 81 +- .../components/AcpDebugDialog.test.ts | 179 + test/renderer/components/AcpSettings.test.ts | 57 +- test/renderer/components/App.startup.test.ts | 48 +- test/renderer/components/BrowserPanel.test.ts | 10 +- .../BuiltinKnowledgeSettings.test.ts | 74 +- test/renderer/components/ChatPage.test.ts | 29 +- .../renderer/components/ChatStatusBar.test.ts | 57 +- .../components/DashboardSettings.test.ts | 4 +- test/renderer/components/DataSettings.test.ts | 158 +- .../components/DeepChatAgentsSettings.test.ts | 133 +- .../components/EnvironmentsSettings.test.ts | 10 +- .../components/GitHubCopilotOAuth.test.ts | 119 + .../renderer/components/KnowledgeFile.test.ts | 165 + 
.../components/KnowledgeFileItem.test.ts | 121 + test/renderer/components/LinkNode.test.ts | 8 - .../components/MarkdownRenderer.test.ts | 4 +- .../components/McpBuiltinMarket.test.ts | 148 + test/renderer/components/McpIndicator.test.ts | 36 +- test/renderer/components/McpSettings.test.ts | 4 +- .../components/ModelProviderSettings.test.ts | 4 +- .../components/ModelScopeMcpSync.test.ts | 94 + .../components/NowledgeMemSettings.test.ts | 168 + .../components/PluginsSettings.test.ts | 6 - .../components/PromptEditorSheet.test.ts | 198 + .../components/ProviderApiConfig.test.ts | 51 +- .../ProviderRateLimitConfig.test.ts | 160 + .../components/RemoteSettings.test.ts | 23 +- .../SettingsApp.providerDeeplink.test.ts | 85 +- test/renderer/components/SettingsApp.test.ts | 255 +- .../components/SkillEditorSheet.test.ts | 139 + .../components/SkillSyncSettings.test.ts | 152 + .../components/SpotlightOverlay.test.ts | 8 +- .../renderer/components/WindowSideBar.test.ts | 8 +- .../components/WorkspaceFileNode.test.ts | 4 +- .../message/MessageBlockContent.test.ts | 13 +- .../message/MessageItemUser.test.ts | 10 +- .../message/SelectedTextContextMenu.test.ts | 79 + .../think-content/ThinkContentStyle.test.ts | 8 +- .../composables/useLegacyPresenter.test.ts | 38 - .../composables/useMessageCapture.test.ts | 11 +- test/renderer/lib/storeInitializer.test.ts | 12 +- test/renderer/stores/dialogStore.test.ts | 76 + test/renderer/stores/mcpStore.test.ts | 10 - test/renderer/stores/messageStore.test.ts | 25 +- test/renderer/stores/ollamaStore.test.ts | 7 - tsconfig.node.tsbuildinfo | 2 +- vitest.config.ts | 18 +- 324 files changed, 112475 insertions(+), 92604 deletions(-) create mode 100644 docs/architecture/presenter-ipc-migration-plan/audit.md create mode 100644 docs/architecture/presenter-ipc-migration-plan/change-map.zh-CN.md create mode 100644 docs/architecture/presenter-ipc-migration-plan/plan.md create mode 100644 docs/architecture/presenter-ipc-migration-plan/spec.md create 
mode 100644 docs/architecture/presenter-ipc-migration-plan/tasks.md create mode 100644 docs/architecture/presenter-ipc-migration-plan/verification.md create mode 100644 src/main/presenter/configPresenter/eventPublishers.ts delete mode 100644 src/main/presenter/sessionPresenter/events.ts delete mode 100644 src/main/routes/legacyTypedEventBridge.ts create mode 100644 src/renderer/api/AcpTerminalClient.ts create mode 100644 src/renderer/api/AppRuntimeClient.ts create mode 100644 src/renderer/api/ContextMenuClient.ts create mode 100644 src/renderer/api/KnowledgeClient.ts create mode 100644 src/renderer/api/NowledgeMemClient.ts create mode 100644 src/renderer/api/OAuthClient.ts create mode 100644 src/renderer/api/RemoteControlClient.ts delete mode 100644 src/renderer/api/RemoteControlRuntime.ts create mode 100644 src/renderer/api/ShortcutClient.ts delete mode 100644 src/renderer/api/ShortcutRuntime.ts create mode 100644 src/renderer/api/SkillSyncClient.ts delete mode 100644 src/renderer/api/legacy/README.md delete mode 100644 src/renderer/api/legacy/presenterTransport.ts delete mode 100644 src/renderer/api/legacy/presenters.ts delete mode 100644 src/renderer/api/legacy/runtime.ts delete mode 100644 src/renderer/src/lib/ipcSubscription.ts create mode 100644 src/shared/contracts/events/acp-terminal.events.ts create mode 100644 src/shared/contracts/events/app-runtime.events.ts create mode 100644 src/shared/contracts/events/context-menu.events.ts create mode 100644 src/shared/contracts/events/knowledge.events.ts create mode 100644 src/shared/contracts/events/notification.events.ts create mode 100644 src/shared/contracts/events/skillSync.events.ts create mode 100644 src/shared/contracts/routes/acp-terminal.routes.ts create mode 100644 src/shared/contracts/routes/knowledge.routes.ts create mode 100644 src/shared/contracts/routes/nowledgeMem.routes.ts create mode 100644 src/shared/contracts/routes/oauth.routes.ts create mode 100644 
src/shared/contracts/routes/remote-control.routes.ts create mode 100644 src/shared/contracts/routes/shortcut.routes.ts create mode 100644 src/shared/contracts/routes/skillSync.routes.ts create mode 100644 src/shared/floatingButtonChannels.ts create mode 100644 test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts create mode 100644 test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts create mode 100644 test/e2e/specs/08-browser-route.smoke.spec.ts create mode 100644 test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts create mode 100644 test/e2e/specs/10-settings-privacy-route.smoke.spec.ts create mode 100644 test/e2e/specs/11-remote-control-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/12-knowledge-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts create mode 100644 test/e2e/specs/15-dashboard-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/16-skills-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/17-acp-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/18-provider-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/21-project-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/22-window-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/23-config-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts create mode 100644 test/e2e/specs/25-window-provider-deeplink-preview.smoke.spec.ts create mode 100644 test/e2e/specs/26-deepchat-agent-crud.smoke.spec.ts create mode 100644 test/e2e/specs/27-hooks-notification-command.smoke.spec.ts create mode 100644 test/e2e/specs/28-shortcut-route-restore.smoke.spec.ts create mode 100644 
test/e2e/specs/29-workspace-readonly-route.smoke.spec.ts create mode 100644 test/main/presenter/configPresenter/fontSizeSettings.test.ts create mode 100644 test/main/presenter/dialogPresenter.test.ts create mode 100644 test/main/presenter/knowledgePresenter/knowledgeStorePresenter.test.ts create mode 100644 test/main/presenter/llmProviderPresenter/ollamaManager.test.ts create mode 100644 test/main/presenter/notificationPresenter.test.ts create mode 100644 test/main/scripts/architectureGuard.test.ts create mode 100644 test/renderer/api/preloadBoundaries.test.ts create mode 100644 test/renderer/components/AcpDebugDialog.test.ts create mode 100644 test/renderer/components/GitHubCopilotOAuth.test.ts create mode 100644 test/renderer/components/KnowledgeFile.test.ts create mode 100644 test/renderer/components/KnowledgeFileItem.test.ts create mode 100644 test/renderer/components/McpBuiltinMarket.test.ts create mode 100644 test/renderer/components/ModelScopeMcpSync.test.ts create mode 100644 test/renderer/components/NowledgeMemSettings.test.ts create mode 100644 test/renderer/components/PromptEditorSheet.test.ts create mode 100644 test/renderer/components/ProviderRateLimitConfig.test.ts create mode 100644 test/renderer/components/SkillEditorSheet.test.ts create mode 100644 test/renderer/components/SkillSyncSettings.test.ts create mode 100644 test/renderer/components/message/SelectedTextContextMenu.test.ts delete mode 100644 test/renderer/composables/useLegacyPresenter.test.ts create mode 100644 test/renderer/stores/dialogStore.test.ts diff --git a/docs/ARCHITECTURE.md b/docs/ARCHITECTURE.md index 51cb0c1de..b900cdbd7 100644 --- a/docs/ARCHITECTURE.md +++ b/docs/ARCHITECTURE.md @@ -58,8 +58,9 @@ flowchart LR - `src/shared/contracts/routes*.ts` 与 `events*.ts` 是 migrated path 的契约真源。 - `src/preload/createBridge.ts` 统一 route invoke 和 typed event subscribe。 - `src/renderer/api/*Client.ts` 是组件和 store 的默认入口。 -- `src/renderer/api/legacy/**` 是唯一 legacy quarantine。当前保留 
`presenters.ts`、 - `presenterTransport.ts`、`runtime.ts` 三个兼容文件;新业务模块不应直接导入 legacy transport。 +- `src/renderer/api/legacy/**` 已退休并从当前树删除;guard 会阻止它被重新创建。 +- raw IPC 只允许存在于 `createBridge` 和专用 preload API 这类明确边界内,业务层不得直接调用 + `presenter:call`、`remoteControlPresenter:call` 或 `window.electron.ipcRenderer`。 ### 2. Main Route Runtime @@ -98,8 +99,9 @@ flowchart LR ## 防回归规则 - 新 renderer-main 能力默认走 `renderer/api/*Client` + `window.deepchat` + shared contracts。 -- legacy transport 只能留在 `src/renderer/api/legacy/**`,不新增第二个 quarantine 目录。 -- `scripts/architecture-guard.mjs` 固定 quarantine 文件数、检测 direct legacy transport、 +- legacy transport 已退休;不要重新创建 `src/renderer/api/legacy/**`,也不要新增第二个 + compatibility quarantine。确有兼容需要时,应先定义窄 typed route/event 或专用 preload API。 +- `scripts/architecture-guard.mjs` 检测 direct legacy transport、已退休 legacy 目录、 并读取 `docs/architecture/baselines/main-kernel-bridge-register.json`。 - `scripts/agent-cleanup-guard.mjs` 用于防止已退休 agent runtime 入口回流。 diff --git a/docs/README.md b/docs/README.md index d16216fff..195d8466d 100644 --- a/docs/README.md +++ b/docs/README.md @@ -16,9 +16,9 @@ Renderer -> agentSessionPresenter / agentRuntimePresenter / toolPresenter / llmProviderPresenter ``` -`useLegacyPresenter()`、`window.electron`、`window.api` 只允许作为兼容路径留在 -`src/renderer/api/legacy/**` quarantine 中。业务模块的新能力应从 `renderer/api/*Client` -和 shared contracts 进入。 +`useLegacyPresenter()`、`presenter:call`、`remoteControlPresenter:call` 和 +`src/renderer/api/legacy/**` 已经退休。业务模块的新能力应从 `renderer/api/*Client` 和 +shared contracts 进入;少数仍需要 raw IPC 的能力只能封装在明确 allowlist 的 preload/API 边界内。 ## 当前必读 diff --git a/docs/architecture/baselines/archive-reference-report.md b/docs/architecture/baselines/archive-reference-report.md index b74b85edc..c9f6607cd 100644 --- a/docs/architecture/baselines/archive-reference-report.md +++ b/docs/architecture/baselines/archive-reference-report.md @@ -1,6 +1,6 @@ # Archive Reference Baseline -Generated on 2026-04-20. +Generated on 2026-06-11. 
- Total references: 0 diff --git a/docs/architecture/baselines/dependency-report.md b/docs/architecture/baselines/dependency-report.md index fbcd0ff9d..0a6917fdd 100644 --- a/docs/architecture/baselines/dependency-report.md +++ b/docs/architecture/baselines/dependency-report.md @@ -1,117 +1,163 @@ # Dependency Baseline -Generated on 2026-04-20. +Generated on 2026-06-11. ## main -- Total files: 360 -- Internal dependency edges: 913 -- Cycles detected: 30 +- Total files: 428 +- Internal dependency edges: 1080 +- Cycles detected: 31 ### Top outgoing dependencies -- `presenter\index.ts`: 42 -- `presenter\configPresenter\index.ts`: 23 -- `presenter\agentRuntimePresenter\index.ts`: 22 -- `presenter\lifecyclePresenter\hooks\index.ts`: 17 -- `presenter\sqlitePresenter\index.ts`: 17 -- `presenter\sqlitePresenter\schemaCatalog.ts`: 17 -- `presenter\llmProviderPresenter\index.ts`: 14 -- `presenter\remoteControlPresenter\index.ts`: 14 -- `presenter\toolPresenter\agentTools\agentToolManager.ts`: 14 -- `presenter\agentSessionPresenter\index.ts`: 13 -- `presenter\llmProviderPresenter\acp\index.ts`: 12 -- `presenter\filePresenter\mime.ts`: 11 -- `presenter\llmProviderPresenter\managers\providerInstanceManager.ts`: 11 -- `presenter\mcpPresenter\inMemoryServers\builder.ts`: 11 -- `presenter\skillSyncPresenter\adapters\index.ts`: 11 +- `presenter/index.ts`: 45 +- `presenter/sqlitePresenter/index.ts`: 29 +- `presenter/agentRuntimePresenter/index.ts`: 27 +- `presenter/configPresenter/index.ts`: 27 +- `presenter/sqlitePresenter/schemaCatalog.ts`: 27 +- `presenter/lifecyclePresenter/hooks/index.ts`: 21 +- `presenter/toolPresenter/agentTools/agentToolManager.ts`: 20 +- `routes/index.ts`: 19 +- `presenter/agentSessionPresenter/index.ts`: 14 +- `presenter/filePresenter/mime.ts`: 14 +- `presenter/llmProviderPresenter/index.ts`: 14 +- `presenter/remoteControlPresenter/index.ts`: 14 +- `presenter/agentRuntimePresenter/dispatch.ts`: 13 +- `presenter/llmProviderPresenter/acp/index.ts`: 12 +- 
`presenter/llmProviderPresenter/acp/acpProcessManager.ts`: 11 ### Top incoming dependencies -- `eventbus.ts`: 56 -- `events.ts`: 56 -- `presenter\index.ts`: 44 -- `presenter\remoteControlPresenter\types.ts`: 37 -- `presenter\remoteControlPresenter\services\remoteBindingStore.ts`: 22 -- `routes\publishDeepchatEvent.ts`: 19 -- `presenter\sqlitePresenter\tables\baseTable.ts`: 17 -- `presenter\remoteControlPresenter\services\remoteConversationRunner.ts`: 16 -- `presenter\sqlitePresenter\index.ts`: 12 -- `presenter\filePresenter\BaseFileAdapter.ts`: 11 -- `presenter\llmProviderPresenter\baseProvider.ts`: 11 -- `lib\runtimeHelper.ts`: 8 -- `presenter\configPresenter\acpRegistryConstants.ts`: 8 -- `presenter\remoteControlPresenter\types\channel.ts`: 8 -- `lib\agentRuntime\sessionPaths.ts`: 7 +- `events.ts`: 55 +- `eventbus.ts`: 54 +- `presenter/index.ts`: 48 +- `presenter/remoteControlPresenter/types.ts`: 37 +- `presenter/sqlitePresenter/tables/baseTable.ts`: 28 +- `routes/publishDeepchatEvent.ts`: 28 +- `presenter/remoteControlPresenter/services/remoteBindingStore.ts`: 22 +- `presenter/sqlitePresenter/index.ts`: 17 +- `presenter/remoteControlPresenter/services/remoteConversationRunner.ts`: 16 +- `presenter/filePresenter/BaseFileAdapter.ts`: 13 +- `presenter/llmProviderPresenter/baseProvider.ts`: 11 +- `presenter/configPresenter/acpRegistryConstants.ts`: 9 +- `presenter/configPresenter/storeLike.ts`: 8 +- `presenter/llmProviderPresenter/acp/index.ts`: 8 +- `presenter/llmProviderPresenter/runtimePorts.ts`: 8 ### Cycle samples -- `presenter\index.ts -> presenter\windowPresenter\index.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\windowPresenter\index.ts -> presenter\tabPresenter.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\windowPresenter\index.ts -> presenter\windowPresenter\FloatingChatWindow.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\shortcutPresenter.ts -> presenter\index.ts` -- `presenter\index.ts -> 
presenter\llmProviderPresenter\index.ts -> presenter\llmProviderPresenter\baseProvider.ts -> presenter\devicePresenter\index.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\llmProviderPresenter\index.ts -> presenter\llmProviderPresenter\managers\providerInstanceManager.ts -> presenter\llmProviderPresenter\providers\githubCopilotProvider.ts -> presenter\githubCopilotDeviceFlow.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\llmProviderPresenter\index.ts -> presenter\llmProviderPresenter\managers\providerInstanceManager.ts -> presenter\llmProviderPresenter\providers\ollamaProvider.ts -> presenter\llmProviderPresenter\aiSdk\index.ts -> presenter\llmProviderPresenter\aiSdk\runtime.ts -> presenter\index.ts` -- `presenter\filePresenter\mime.ts -> presenter\filePresenter\CsvFileAdapter.ts -> presenter\filePresenter\BaseFileAdapter.ts -> presenter\filePresenter\mime.ts` -- `presenter\index.ts -> presenter\sessionPresenter\index.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\sessionPresenter\index.ts -> presenter\sessionPresenter\managers\conversationManager.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\upgradePresenter\index.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\serverManager.ts -> presenter\mcpPresenter\mcpClient.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\serverManager.ts -> presenter\mcpPresenter\mcpClient.ts -> presenter\mcpPresenter\inMemoryServers\builder.ts -> presenter\mcpPresenter\inMemoryServers\deepResearchServer.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\serverManager.ts -> presenter\mcpPresenter\mcpClient.ts -> presenter\mcpPresenter\inMemoryServers\builder.ts -> presenter\mcpPresenter\inMemoryServers\autoPromptingServer.ts -> presenter\index.ts` -- `presenter\index.ts -> 
presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\serverManager.ts -> presenter\mcpPresenter\mcpClient.ts -> presenter\mcpPresenter\inMemoryServers\builder.ts -> presenter\mcpPresenter\inMemoryServers\conversationSearchServer.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\serverManager.ts -> presenter\mcpPresenter\mcpClient.ts -> presenter\mcpPresenter\inMemoryServers\builder.ts -> presenter\mcpPresenter\inMemoryServers\builtinKnowledgeServer.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\mcpPresenter\toolManager.ts -> presenter\index.ts` -- `presenter\index.ts -> presenter\mcpPresenter\index.ts -> presenter\index.ts` -- `presenter\sqlitePresenter\index.ts -> presenter\agentSessionPresenter\legacyImportService.ts -> presenter\sqlitePresenter\index.ts` -- `presenter\index.ts -> presenter\syncPresenter\index.ts -> presenter\index.ts` - -## renderer - -- Total files: 220 -- Internal dependency edges: 376 +- `presenter/index.ts -> presenter/windowPresenter/index.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/windowPresenter/index.ts -> presenter/tabPresenter.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/windowPresenter/index.ts -> presenter/windowPresenter/FloatingChatWindow.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/shortcutPresenter.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/llmProviderPresenter/index.ts -> presenter/llmProviderPresenter/baseProvider.ts -> presenter/devicePresenter/index.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/llmProviderPresenter/index.ts -> presenter/llmProviderPresenter/managers/providerInstanceManager.ts -> presenter/llmProviderPresenter/providers/githubCopilotProvider.ts -> presenter/githubCopilotDeviceFlow.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/llmProviderPresenter/index.ts -> 
presenter/llmProviderPresenter/managers/providerInstanceManager.ts -> presenter/llmProviderPresenter/providers/ollamaProvider.ts -> presenter/llmProviderPresenter/aiSdk/index.ts -> presenter/llmProviderPresenter/aiSdk/runtime.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/sessionPresenter/index.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/sessionPresenter/index.ts -> presenter/sessionPresenter/managers/conversationManager.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/upgradePresenter/index.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/serverManager.ts -> presenter/mcpPresenter/mcpClient.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/serverManager.ts -> presenter/mcpPresenter/mcpClient.ts -> presenter/mcpPresenter/inMemoryServers/builder.ts -> presenter/mcpPresenter/inMemoryServers/deepResearchServer.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/serverManager.ts -> presenter/mcpPresenter/mcpClient.ts -> presenter/mcpPresenter/inMemoryServers/builder.ts -> presenter/mcpPresenter/inMemoryServers/autoPromptingServer.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/serverManager.ts -> presenter/mcpPresenter/mcpClient.ts -> presenter/mcpPresenter/inMemoryServers/builder.ts -> presenter/mcpPresenter/inMemoryServers/conversationSearchServer.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/serverManager.ts -> presenter/mcpPresenter/mcpClient.ts -> presenter/mcpPresenter/inMemoryServers/builder.ts -> presenter/mcpPresenter/inMemoryServers/builtinKnowledgeServer.ts -> presenter/index.ts` +- `presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/mcpPresenter/toolManager.ts -> presenter/index.ts` +- 
`presenter/index.ts -> presenter/mcpPresenter/index.ts -> presenter/index.ts` +- `presenter/sqlitePresenter/index.ts -> presenter/agentSessionPresenter/legacyImportService.ts -> presenter/sqlitePresenter/index.ts` +- `presenter/sqlitePresenter/index.ts -> presenter/agentSessionPresenter/legacyImportService.ts -> presenter/agentRuntimePresenter/messageStore.ts -> presenter/sqlitePresenter/index.ts` +- `presenter/index.ts -> presenter/syncPresenter/index.ts -> presenter/index.ts` + +## renderer-main + +- Total files: 261 +- Internal dependency edges: 458 - Cycles detected: 3 ### Top outgoing dependencies -- `App.vue`: 25 -- `pages\ChatPage.vue`: 16 -- `components\message\MessageItemAssistant.vue`: 15 -- `i18n\index.ts`: 12 -- `components\chat\ChatStatusBar.vue`: 9 -- `views\ChatTabView.vue`: 9 -- `components\ChatConfig.vue`: 8 -- `components\mcp-config\components\McpServers.vue`: 8 -- `components\sidepanel\viewer\WorkspacePreviewPane.vue`: 8 -- `components\sidepanel\WorkspacePanel.vue`: 8 -- `pages\NewThreadPage.vue`: 8 -- `components\markdown\MarkdownRenderer.vue`: 7 -- `components\mcp-config\components\index.ts`: 7 -- `components\message\MessageBlockContent.vue`: 7 -- `lib\storeInitializer.ts`: 7 +- `App.vue`: 29 +- `pages/ChatPage.vue`: 27 +- `i18n/index.ts`: 20 +- `components/message/MessageItemAssistant.vue`: 18 +- `pages/NewThreadPage.vue`: 18 +- `components/chat/ChatStatusBar.vue`: 17 +- `views/ChatTabView.vue`: 12 +- `components/ChatConfig.vue`: 8 +- `components/sidepanel/WorkspacePanel.vue`: 8 +- `components/sidepanel/viewer/WorkspacePreviewPane.vue`: 8 +- `components/WindowSideBar.vue`: 7 +- `components/chat/ChatInputBox.vue`: 7 +- `components/markdown/MarkdownRenderer.vue`: 7 +- `components/mcp-config/components/McpServers.vue`: 7 +- `components/mcp-config/components/index.ts`: 7 ### Top incoming dependencies -- `components\chat\messageListItems.ts`: 16 -- `stores\ui\session.ts`: 16 -- `stores\artifact.ts`: 13 -- `stores\providerStore.ts`: 13 -- 
`stores\theme.ts`: 12 -- `stores\ui\agent.ts`: 12 -- `stores\modelStore.ts`: 10 -- `stores\ui\sidepanel.ts`: 10 -- `stores\uiSettingsStore.ts`: 10 -- `stores\mcp.ts`: 8 -- `components\icons\ModelIcon.vue`: 6 -- `components\use-toast.ts`: 6 -- `stores\language.ts`: 6 -- `stores\ui\draft.ts`: 5 -- `stores\ui\pageRouter.ts`: 5 +- `components/chat/messageListItems.ts`: 22 +- `stores/ui/session.ts`: 16 +- `stores/providerStore.ts`: 14 +- `stores/artifact.ts`: 13 +- `stores/theme.ts`: 13 +- `stores/ui/agent.ts`: 13 +- `stores/uiSettingsStore.ts`: 12 +- `stores/modelStore.ts`: 11 +- `stores/ui/sidepanel.ts`: 10 +- `components/use-toast.ts`: 9 +- `stores/mcp.ts`: 8 +- `components/icons/ModelIcon.vue`: 6 +- `lib/onboardingResume.ts`: 6 +- `stores/language.ts`: 6 +- `stores/ui/draft.ts`: 5 ### Cycle samples -- `components\json-viewer\JsonValue.ts -> components\json-viewer\JsonObject.ts -> components\json-viewer\JsonValue.ts` -- `components\json-viewer\JsonValue.ts -> components\json-viewer\JsonArray.ts -> components\json-viewer\JsonValue.ts` -- `composables\usePageCapture.example.ts -> composables\usePageCapture.example.ts` +- `components/json-viewer/JsonValue.ts -> components/json-viewer/JsonObject.ts -> components/json-viewer/JsonValue.ts` +- `components/json-viewer/JsonArray.ts -> components/json-viewer/JsonValue.ts -> components/json-viewer/JsonArray.ts` +- `composables/usePageCapture.example.ts -> composables/usePageCapture.example.ts` + +## renderer-settings + +- Total files: 92 +- Internal dependency edges: 98 +- Cycles detected: 0 + +### Top outgoing dependencies + +- `main.ts`: 19 +- `components/ModelProviderSettingsDetail.vue`: 10 +- `components/skills/SkillsSettings.vue`: 8 +- `components/KnowledgeBaseSettings.vue`: 7 +- `components/CommonSettings.vue`: 5 +- `components/ModelProviderSettings.vue`: 5 +- `components/BedrockProviderSettingsDetail.vue`: 4 +- `components/SettingsOverview.vue`: 4 +- `components/DataSettings.vue`: 3 +- `components/PromptSetting.vue`: 3 
+- `components/skills/SkillSyncDialog/ImportWizard.vue`: 3 +- `App.vue`: 2 +- `components/DisplaySettings.vue`: 2 +- `components/McpSettings.vue`: 2 +- `components/skills/SkillSyncDialog/SkillSyncDialog.vue`: 2 + +### Top incoming dependencies + +- `components/control-center/SettingsPageShell.vue`: 12 +- `lib/guidedOnboardingSettings.ts`: 3 +- `components/ProviderDialogContainer.vue`: 2 +- `components/ProviderModelManager.vue`: 2 +- `components/ProviderRateLimitConfig.vue`: 2 +- `components/ProviderSettingsShell.vue`: 2 +- `components/common/SettingToggleRow.vue`: 2 +- `components/skills/SkillSyncDialog/ConflictResolver.vue`: 2 +- `App.vue`: 1 +- `components/AboutUsSettings.vue`: 1 +- `components/AcpDebugDialog.vue`: 1 +- `components/AcpSettings.vue`: 1 +- `components/AddCustomModelButton.vue`: 1 +- `components/AddCustomProviderDialog.vue`: 1 +- `components/AzureProviderConfig.vue`: 1 + +### Cycle samples + +- None diff --git a/docs/architecture/baselines/main-kernel-boundary-baseline.md b/docs/architecture/baselines/main-kernel-boundary-baseline.md index 52844fc24..04925427f 100644 --- a/docs/architecture/baselines/main-kernel-boundary-baseline.md +++ b/docs/architecture/baselines/main-kernel-boundary-baseline.md @@ -1,59 +1,57 @@ # Main Kernel Boundary Baseline -Generated on 2026-04-20. +Generated on 2026-06-11. Current phase: P5. 
## Metric Snapshot | Metric | Value | | --- | --- | -| `renderer.usePresenter.count` | 1 | +| `renderer.usePresenter.count` | 0 | | `renderer.business.usePresenter.count` | 0 | -| `renderer.quarantine.usePresenter.count` | 1 | -| `renderer.windowElectron.count` | 2 | +| `renderer.quarantine.usePresenter.count` | 0 | +| `renderer.windowElectron.count` | 0 | | `renderer.business.windowElectron.count` | 0 | -| `renderer.quarantine.windowElectron.count` | 2 | -| `renderer.windowApi.count` | 2 | +| `renderer.quarantine.windowElectron.count` | 0 | +| `renderer.windowApi.count` | 0 | | `renderer.business.windowApi.count` | 0 | -| `renderer.quarantine.windowApi.count` | 2 | -| `renderer.quarantine.sourceFile.count` | 3 | +| `renderer.quarantine.windowApi.count` | 0 | +| `renderer.quarantine.sourceFile.count` | 0 | | `hotpath.presenterEdge.count` | 10 | -| `runtime.rawTimer.count` | 122 | +| `runtime.rawTimer.count` | 157 | | `migrated.rawChannel.count` | 4 | | `bridge.active.count` | 0 | | `bridge.expired.count` | 0 | ## Renderer Single-Track Split -- Business layer: `src/renderer/src/**` -- Quarantine layer: `src/renderer/api/legacy/**` +- Business layer: `src/renderer/src/**`, `src/renderer/settings/**` +- Retired quarantine layer: `src/renderer/api/legacy/**` must remain deleted | Legacy surface | Business layer | Quarantine layer | Total | | --- | --- | --- | --- | -| legacy presenter helper | 0 | 1 | 1 | -| `window.electron` | 0 | 2 | 2 | -| `window.api` | 0 | 2 | 2 | +| legacy presenter helper | 0 | 0 | 0 | +| `window.electron` | 0 | 0 | 0 | +| `window.api` | 0 | 0 | 0 | ## Quarantine Exit Snapshot -- Retained capability family: `renderer legacy transport` -- Source files: 3 / 3 -- Delete condition: remove after settings compatibility surfaces stop importing the quarantine adapters. 
+- Retained capability family: none; `renderer legacy transport` is retired +- Source files: 0 / 0 +- Delete condition: already satisfied; a recreated quarantine directory is a regression. -- `src/renderer/api/legacy/presenterTransport.ts` -- `src/renderer/api/legacy/presenters.ts` -- `src/renderer/api/legacy/runtime.ts` +- None ## Phase Gates | Phase | Gate indicator | Current signal | Status | | --- | --- | --- | --- | -| `P0` | Fixed quarantine path `src/renderer/api/legacy/**` exists and baseline emits business/quarantine split metrics | `src/renderer/api/legacy/**` exists; split metrics emitted | ready | +| `P0` | Retired quarantine path `src/renderer/api/legacy/**` must remain deleted and baseline emits business/retired split metrics | `src/renderer/api/legacy/**` deleted; split metrics emitted | ready | | `P1` | Business layer direct legacy presenter helper / `window.electron` / `window.api` counts must reach `0` | legacyPresenter=0, window.electron=0, window.api=0 | ready | | `P2` | Business layer `configPresenter` and `llmproviderPresenter` hits must reach `0` | configPresenter=0, llmproviderPresenter=0 | ready | | `P3` | Business layer window/device/workspace/project/file/browser/tab presenter hits must reach `0` | window=0, device=0, workspace=0, project=0, file=0, browser=0, tab=0 | ready | | `P4` | Business layer session residual / skill / mcp / sync / upgrade / dialog / tool presenter hits must reach `0` | agentSession=0, skill=0, mcp=0, sync=0, upgrade=0, dialog=0, tool=0 | ready | -| `P5` | Business layer direct legacy access must be `0`, and quarantine source files must satisfy the exit standard (`<= 3` source files) | businessLegacy=0/0/0, quarantineSourceFiles=3/3 | ready | +| `P5` | Business layer direct legacy access must be `0`, and retired quarantine source files must stay at `0` | businessLegacy=0/0/0, quarantineSourceFiles=0/0 | ready | ## Hot Path Direct Dependencies @@ -72,39 +70,38 @@ Current phase: P5. 
## Renderer legacy presenter helpers -- Total count: 1 +- Total count: 0 -- `src/renderer/api/legacy/presenters.ts`: 1 +- None ## Renderer window.electron -- Total count: 2 +- Total count: 0 -- `src/renderer/api/legacy/presenterTransport.ts`: 1 -- `src/renderer/api/legacy/runtime.ts`: 1 +- None ## Renderer window.api -- Total count: 2 +- Total count: 0 -- `src/renderer/api/legacy/runtime.ts`: 2 +- None ## Raw Timers -- Total count: 122 +- Total count: 157 - `src/main/presenter/githubCopilotDeviceFlow.ts`: 6 - `src/main/presenter/browser/BrowserTab.ts`: 5 - `src/main/presenter/devicePresenter/index.ts`: 5 +- `src/main/presenter/llmProviderPresenter/aiSdk/runtime.ts`: 5 - `src/renderer/src/components/message/MessageToolbar.vue`: 4 - `src/renderer/src/composables/message/useMessageScroll.ts`: 4 - `src/main/lib/agentRuntime/backgroundExecSessionManager.ts`: 3 - `src/main/presenter/configPresenter/acpInitHelper.ts`: 3 +- `src/main/presenter/lifecyclePresenter/SplashWindowManager.ts`: 3 - `src/main/presenter/skillPresenter/skillExecutionService.ts`: 3 - `src/main/presenter/tabPresenter.ts`: 3 - `src/main/presenter/upgradePresenter/index.ts`: 3 -- `src/renderer/src/stores/mcp.ts`: 3 -- `src/main/lib/agentRuntime/rtkRuntimeService.ts`: 2 ## Migrated Path Raw Channel Literals diff --git a/docs/architecture/baselines/main-kernel-migration-scoreboard.json b/docs/architecture/baselines/main-kernel-migration-scoreboard.json index 8af594126..57ad23c76 100644 --- a/docs/architecture/baselines/main-kernel-migration-scoreboard.json +++ b/docs/architecture/baselines/main-kernel-migration-scoreboard.json @@ -1,20 +1,20 @@ { "program": "main-kernel-refactor", - "generatedOn": "2026-04-20", + "generatedOn": "2026-06-11", "currentPhase": "P5", "metrics": { - "renderer.usePresenter.count": 1, + "renderer.usePresenter.count": 0, "renderer.business.usePresenter.count": 0, - "renderer.quarantine.usePresenter.count": 1, - "renderer.windowElectron.count": 2, + 
"renderer.quarantine.usePresenter.count": 0, + "renderer.windowElectron.count": 0, "renderer.business.windowElectron.count": 0, - "renderer.quarantine.windowElectron.count": 2, - "renderer.windowApi.count": 2, + "renderer.quarantine.windowElectron.count": 0, + "renderer.windowApi.count": 0, "renderer.business.windowApi.count": 0, - "renderer.quarantine.windowApi.count": 2, - "renderer.quarantine.sourceFile.count": 3, + "renderer.quarantine.windowApi.count": 0, + "renderer.quarantine.sourceFile.count": 0, "hotpath.presenterEdge.count": 10, - "runtime.rawTimer.count": 122, + "runtime.rawTimer.count": 157, "migrated.rawChannel.count": 4, "bridge.active.count": 0, "bridge.expired.count": 0 @@ -22,8 +22,8 @@ "phaseGates": [ { "phase": "P0", - "indicator": "Fixed quarantine path `src/renderer/api/legacy/**` exists and baseline emits business/quarantine split metrics", - "current": "`src/renderer/api/legacy/**` exists; split metrics emitted", + "indicator": "Retired quarantine path `src/renderer/api/legacy/**` must remain deleted and baseline emits business/retired split metrics", + "current": "`src/renderer/api/legacy/**` deleted; split metrics emitted", "status": "ready" }, { @@ -52,8 +52,8 @@ }, { "phase": "P5", - "indicator": "Business layer direct legacy access must be `0`, and quarantine source files must satisfy the exit standard (`<= 3` source files)", - "current": "businessLegacy=0/0/0, quarantineSourceFiles=3/3", + "indicator": "Business layer direct legacy access must be `0`, and retired quarantine source files must stay at `0`", + "current": "businessLegacy=0/0/0, quarantineSourceFiles=0/0", "status": "ready" } ], diff --git a/docs/architecture/baselines/main-kernel-migration-scoreboard.md b/docs/architecture/baselines/main-kernel-migration-scoreboard.md index 6f0f05ad8..f6d930994 100644 --- a/docs/architecture/baselines/main-kernel-migration-scoreboard.md +++ b/docs/architecture/baselines/main-kernel-migration-scoreboard.md @@ -1,24 +1,24 @@ # Main Kernel 
Migration Scoreboard -Generated on 2026-04-20. +Generated on 2026-06-11. Current phase: P5. Phase 0 establishes the comparison baseline. Later phases should update this report and compare against this checkpoint. | Metric | Value | Status | | --- | --- | --- | -| `renderer.usePresenter.count` | 1 | baseline | +| `renderer.usePresenter.count` | 0 | baseline | | `renderer.business.usePresenter.count` | 0 | baseline | -| `renderer.quarantine.usePresenter.count` | 1 | baseline | -| `renderer.windowElectron.count` | 2 | baseline | +| `renderer.quarantine.usePresenter.count` | 0 | baseline | +| `renderer.windowElectron.count` | 0 | baseline | | `renderer.business.windowElectron.count` | 0 | baseline | -| `renderer.quarantine.windowElectron.count` | 2 | baseline | -| `renderer.windowApi.count` | 2 | baseline | +| `renderer.quarantine.windowElectron.count` | 0 | baseline | +| `renderer.windowApi.count` | 0 | baseline | | `renderer.business.windowApi.count` | 0 | baseline | -| `renderer.quarantine.windowApi.count` | 2 | baseline | -| `renderer.quarantine.sourceFile.count` | 3 | baseline | +| `renderer.quarantine.windowApi.count` | 0 | baseline | +| `renderer.quarantine.sourceFile.count` | 0 | baseline | | `hotpath.presenterEdge.count` | 10 | baseline | -| `runtime.rawTimer.count` | 122 | baseline | +| `runtime.rawTimer.count` | 157 | baseline | | `migrated.rawChannel.count` | 4 | baseline | | `bridge.active.count` | 0 | baseline | | `bridge.expired.count` | 0 | baseline | @@ -27,10 +27,10 @@ Phase 0 establishes the comparison baseline. 
Later phases should update this rep | Phase | Status | Current signal | | --- | --- | --- | -| `P0` | ready | `src/renderer/api/legacy/**` exists; split metrics emitted | +| `P0` | ready | `src/renderer/api/legacy/**` deleted; split metrics emitted | | `P1` | ready | legacyPresenter=0, window.electron=0, window.api=0 | | `P2` | ready | configPresenter=0, llmproviderPresenter=0 | | `P3` | ready | window=0, device=0, workspace=0, project=0, file=0, browser=0, tab=0 | | `P4` | ready | agentSession=0, skill=0, mcp=0, sync=0, upgrade=0, dialog=0, tool=0 | -| `P5` | ready | businessLegacy=0/0/0, quarantineSourceFiles=3/3 | +| `P5` | ready | businessLegacy=0/0/0, quarantineSourceFiles=0/0 | diff --git a/docs/architecture/baselines/zero-inbound-candidates.md b/docs/architecture/baselines/zero-inbound-candidates.md index 22d13f18a..fafc21875 100644 --- a/docs/architecture/baselines/zero-inbound-candidates.md +++ b/docs/architecture/baselines/zero-inbound-candidates.md @@ -1,75 +1,96 @@ # Zero Inbound Candidates -Generated on 2026-04-20. +Generated on 2026-06-11. These files have no in-repo importers inside their scope and need manual classification before deletion. 
## main -- Candidate count: 15 +- Candidate count: 16 +- `backgroundExecUtilityHostEntry.ts` - `env.d.ts` -- `lib\system.ts` -- `lib\terminalHelper.ts` -- `presenter\browser\BrowserContextBuilder.ts` -- `presenter\configPresenter\aes.ts` -- `presenter\llmProviderPresenter\oauthHelper.ts` -- `presenter\mcpPresenter\agentMcpFilter.ts` -- `presenter\searchPrompts\searchPrompts.ts` -- `presenter\sessionPresenter\events.ts` -- `presenter\sessionPresenter\persistence\conversationPersister.ts` -- `presenter\sessionPresenter\persistence\messagePersister.ts` -- `presenter\sessionPresenter\tab\tabAdapter.ts` -- `presenter\sessionPresenter\types.ts` -- `presenter\sqlitePresenter\tables\attachments.ts` -- `presenter\workspacePresenter\fileCache.ts` +- `lib/system.ts` +- `lib/terminalHelper.ts` +- `presenter/browser/BrowserContextBuilder.ts` +- `presenter/configPresenter/aes.ts` +- `presenter/llmProviderPresenter/oauthHelper.ts` +- `presenter/mcpPresenter/agentMcpFilter.ts` +- `presenter/searchPrompts/searchPrompts.ts` +- `presenter/sessionPresenter/events.ts` +- `presenter/sessionPresenter/persistence/conversationPersister.ts` +- `presenter/sessionPresenter/persistence/messagePersister.ts` +- `presenter/sessionPresenter/tab/tabAdapter.ts` +- `presenter/sessionPresenter/types.ts` +- `presenter/sqlitePresenter/tables/attachments.ts` +- `presenter/workspacePresenter/fileCache.ts` -## renderer +## renderer-main -- Candidate count: 44 +- Candidate count: 46 -- `components\ChatConfig.vue` -- `components\ChatConfig\ConfigSwitchField.vue` -- `components\FileItem.vue` -- `components\ModelSelect.vue` -- `components\ScrollablePopover.vue` -- `components\artifacts\ArtifactBlock.vue` -- `components\chat-input\SkillsIndicator.vue` -- `components\chat-input\VoiceCallWidget.vue` -- `components\chat-input\components\ToolbarButton.vue` -- `components\chat-input\composables\useAgentMcpData.ts` -- `components\chat-input\composables\useContextLength.ts` -- 
`components\chat-input\composables\useDragAndDrop.ts` -- `components\chat-input\composables\useInputHistory.ts` -- `components\chat-input\composables\useInputSettings.ts` -- `components\chat-input\composables\usePromptInputFiles.ts` -- `components\chat-input\composables\useRateLimitStatus.ts` -- `components\editor\mention\PromptParamsDialog.vue` -- `components\editor\mention\mention.ts` -- `components\editor\mention\slashMention.ts` -- `components\mcp-config\AgentMcpSelector.vue` -- `components\message\MessageActionButtons.vue` -- `components\message\MessageItemPlaceholder.vue` -- `components\message\ReferencePreview.vue` -- `components\settings\ModelConfigItem.vue` -- `composables\message\useMessageScroll.ts` -- `composables\useArtifactCodeEditor.ts` -- `composables\useArtifactContext.ts` -- `composables\useArtifactExport.ts` -- `composables\useArtifactViewMode.ts` -- `composables\useSearchConfig.ts` -- `composables\useViewportSize.ts` +- `components/ChatConfig.vue` +- `components/ChatConfig/ConfigSwitchField.vue` +- `components/FileItem.vue` +- `components/ModelSelect.vue` +- `components/ScrollablePopover.vue` +- `components/artifacts/ArtifactBlock.vue` +- `components/chat-input/SkillsIndicator.vue` +- `components/chat-input/VoiceCallWidget.vue` +- `components/chat-input/components/ToolbarButton.vue` +- `components/chat-input/composables/useAgentMcpData.ts` +- `components/chat-input/composables/useContextLength.ts` +- `components/chat-input/composables/useDragAndDrop.ts` +- `components/chat-input/composables/useInputHistory.ts` +- `components/chat-input/composables/useInputSettings.ts` +- `components/chat-input/composables/usePromptInputFiles.ts` +- `components/chat-input/composables/useRateLimitStatus.ts` +- `components/chat/composables/useVoiceInput.ts` +- `components/editor/mention/PromptParamsDialog.vue` +- `components/editor/mention/mention.ts` +- `components/editor/mention/slashMention.ts` +- `components/mcp-config/AgentMcpSelector.vue` +- 
`components/mcp-config/const.ts` +- `components/message/MessageActionButtons.vue` +- `components/message/MessageItemPlaceholder.vue` +- `components/message/ReferencePreview.vue` +- `components/settings/ModelConfigItem.vue` +- `composables/message/useMessageScroll.ts` +- `composables/useArtifactCodeEditor.ts` +- `composables/useArtifactContext.ts` +- `composables/useArtifactExport.ts` +- `composables/useArtifactViewMode.ts` +- `composables/useSearchConfig.ts` +- `composables/useViewportSize.ts` - `env.d.ts` -- `lib\float.cursor.ts` -- `lib\gemini.ts` -- `lib\sanitizeText.ts` +- `lib/float.cursor.ts` +- `lib/gemini.ts` +- `lib/sanitizeText.ts` +- `main.ts` +- `stores/floatingButton.ts` +- `stores/prompts.ts` +- `stores/providerDeeplinkImport.ts` +- `stores/shortcutKey.ts` +- `stores/sync.ts` +- `stores/systemPromptStore.ts` +- `utils/maxOutputTokens.ts` +- `views/SettingsTabView.vue` + +## renderer-settings + +- Candidate count: 13 + +- `components/AcpDependencyDialog.vue` +- `components/AcpProfileDialog.vue` +- `components/AcpProfileManagerDialog.vue` +- `components/AcpTerminalDialog.vue` +- `components/common/AutoCompactionSettingsSection.vue` +- `components/common/DefaultModelSettingsSection.vue` +- `components/prompt/PromptSettingsHeader.vue` +- `components/skills/SkillSyncDialog/SyncResult.vue` +- `components/skills/SkillsHeader.vue` +- `icons/MaximizeIcon.vue` +- `icons/MinimizeIcon.vue` +- `icons/RestoreIcon.vue` - `main.ts` -- `stores\floatingButton.ts` -- `stores\prompts.ts` -- `stores\providerDeeplinkImport.ts` -- `stores\shortcutKey.ts` -- `stores\sync.ts` -- `stores\systemPromptStore.ts` -- `utils\maxOutputTokens.ts` -- `views\SettingsTabView.vue` diff --git a/docs/architecture/event-system.md b/docs/architecture/event-system.md index 23c937b92..93e77c82b 100644 --- a/docs/architecture/event-system.md +++ b/docs/architecture/event-system.md @@ -5,7 +5,8 @@ 注意: - 当前 active renderer-main boundary 已经优先走 `renderer/api/*Client` + `window.deepchat` + typed 
contracts -- 下文中涉及 `useLegacyPresenter()`、`window.api`、raw `window.electron` 的内容,应视为 legacy / compatibility 背景 +- 历史 `useLegacyPresenter()` / `presenter:call` transport 已退休;新调用不得重新引入该路径 +- raw `window.electron` 只能出现在明确 allowlist 的 preload/bridge 边界 - 当前 single-track 规则见 `docs/ARCHITECTURE.md` 的 renderer-main boundary 章节 ## 📋 核心组件 @@ -183,12 +184,8 @@ sendToTab(tabId: number, eventName: string, ...args) { ### 4. sendToWindow - 窗口级别通信 -```typescript -// 发送到特定窗口的所有标签页 -eventBus.sendToWindow(windowId, TAB_EVENTS.TITLE_UPDATED, { - title: '新标题' -}) -``` +当前新代码不应再通过 raw tab renderer channel 同步标签标题或标签列表;窗口/标签状态如需暴露给 +renderer,应先定义 shared typed event contract,再由 presenter 发布 typed envelope。 **实现**: @@ -428,7 +425,6 @@ eventBus.send(MCP_EVENTS.TOOL_CALL_RESULT, { ```typescript export const TAB_EVENTS = { - TITLE_UPDATED: 'tab:title-updated', // 标签标题更新 CONTENT_UPDATED: 'tab:content-updated', // 标签内容更新 STATE_CHANGED: 'tab:state-changed', // 标签状态变化 VISIBILITY_CHANGED: 'tab:visibility-changed', // 标签可见性变化 @@ -455,27 +451,27 @@ eventBus.sendToMain(TAB_EVENTS.RENDERER_TAB_READY, { tabId }) eventBus.send(TAB_EVENTS.CLOSED, { tabId }) ``` -### WINDOW_EVENTS - 窗口事件 +### WINDOW_EVENTS - 窗口内部事件 ```typescript export const WINDOW_EVENTS = { - READY_TO_SHOW: 'window:ready-to-show', // 窗口准备显示 - WINDOW_FOCUSED: 'window:focused', // 窗口获得焦点 - WINDOW_BLURRED: 'window:blurred', // 窗口失去焦点 - WINDOW_MAXIMIZED: 'window:maximized', // 窗口最大化 - WINDOW_UNMAXIMIZED: 'window:unmaximized', // 窗口还原 - WINDOW_RESIZED: 'window:resized', // 窗口大小变化 - WINDOW_CLOSED: 'window:closed', // 窗口关闭 - ENTER_FULL_SCREEN: 'window:enter-full-screen', // 进入全屏 - LEAVE_FULL_SCREEN: 'window:leave-full-screen', // 退出全屏 + WINDOW_RESIZE: 'window:resize', // main 内部:窗口大小变化 + WINDOW_MAXIMIZED: 'window:maximized', // main 内部:窗口最大化 + WINDOW_UNMAXIMIZED: 'window:unmaximized', // main 内部:窗口还原 + WINDOW_ENTER_FULL_SCREEN: 'window:enter-full-screen', + WINDOW_LEAVE_FULL_SCREEN: 'window:leave-full-screen', + WINDOW_CLOSED: 'window:closed' 
} ``` **使用场景**: - 窗口生命周期管理 -- 窗口 UI 状态同步 +- TabPresenter 根据窗口尺寸、最大化、全屏和关闭事件调整 BrowserView bounds +- 主窗口和设置窗口的 renderer UI 状态必须使用 typed `window.state.changed` 事件,不再直接监听 + `window:maximized` / `window:unmaximized` / `window:enter-full-screen` / + `window:leave-full-screen` raw channel -**文件位置**:`src/main/events.ts:88-107` +**文件位置**:`src/main/events.ts` ### WORKSPACE_EVENTS - 工作区事件 @@ -660,151 +656,71 @@ sequenceDiagram - typed event contract - `renderer/api/*Client` -下面的 `useLegacyPresenter()` 小节主要用于解释 legacy transport 是如何工作的,以及为什么它需要被继续收口。 - -### useLegacyPresenter - legacy Presenter 兼容调用 - -**文件位置**:`src/renderer/api/legacy/presenters.ts` - -| 组件 | 文件位置 | 职责 | -|------|---------|------| -| **useLegacyPresenter** | `src/renderer/api/legacy/presenters.ts` | 为兼容路径提供类型安全的 Presenter 方法调用代理 | - -### 工作原理 - -`useLegacyPresenter()` 实现了渲染层到主进程的 legacy 双向代理调用系统: - -1. **类型安全** - 通过 TypeScript 泛型确保调用方法的类型正确 -2. **WebContentsId 映射** - 自动获取并缓存当前的 webContentsId,供主进程映射到 tabId/windowId -3. **安全序列化** - `safeSerialize()` 处理不可序列化对象 -4. **统一 IPC 通道** - 所有调用通过 `presenter:call` 路由到主进程 +历史 `useLegacyPresenter()`、`presenter:call`、`remoteControlPresenter:call` 和 +`src/renderer/api/legacy/**` 已删除。当前 request/response 调用统一通过 shared route +contract、`window.deepchat.invoke()` 和 `renderer/api/*Client` 完成;主进程 route handler 再转接到 +对应 presenter 或 service。 ```mermaid sequenceDiagram - participant UI as Vue Component - participant UP as useLegacyPresenter - participant IPC as electron.ipcRenderer - participant Router as presenter:call - participant P as Presenter - - UI->>UP: useLegacyPresenter('agentSessionPresenter') - UI->>UP: sendMessage(...) 
- UP->>UP: safeSerialize(payloads) - UP->>UP: getLegacyWebContentsId() - UP->>IPC: invoke(presenter:call) - IPC->>Router: 路由到指定 Presenter - Router->>P: 调用 sendMessage - P-->>Router: 返回结果 - Router-->>IPC: 返回结果 - IPC-->>UP: Promise resolve - UP-->>UI: 返回结果 -``` - -### 核心实现 - -```typescript -export function useLegacyPresenter( - name: T, - options?: LegacyPresenterOptions -): IPresenter[T] { - return useLegacyPresenterTransport(name, options) -} -``` - -通过 Proxy 机制,所有对 Presenter 方法的调用都会被拦截并转换为 IPC 调用: - -```typescript -Proxy handler: - get(presenterName, functionName) { - return async (...payloads) => { - const webContentsId = getLegacyWebContentsId() - const rawPayloads = payloads.map((e) => safeSerialize(toRaw(e))) - return window.electron.ipcRenderer.invoke( - 'presenter:call', - presenterName, - functionName, - ...rawPayloads - ) - } - } -``` - -### WebContentsId 到 tabId/windowId 映射 - -- legacy runtime 通过 `getLegacyWebContentsId()` 包装 `window.api.getWebContentsId()` 获取自己的 webContentsId -- 主进程通过 IPC 调用携带的 webContentsId 自动映射到对应的 tabId 和 windowId -- 这解决了渲染层不知道自己所属 tabId 的问题 - -### 使用示例 - -```typescript -// Vue 组件中 -import { useLegacyPresenter } from '@api/legacy/presenters' - -const agentPresenter = useLegacyPresenter('agentSessionPresenter') -const projectPresenter = useLegacyPresenter('projectPresenter') - -// 发送消息 -async function sendMessage(sessionId: string, content: string) { - await agentPresenter.sendMessage(sessionId, content) -} - -// 打开项目目录 -async function openProject(path: string) { - await projectPresenter.openDirectory(path) -} -``` - -### 与 EventBus 的区别 - -| 特性 | EventBus | useLegacyPresenter (legacy IPC) | -|------|----------|-------------------| + participant UI as Vue Component / Store + participant Client as renderer/api Client + participant Bridge as window.deepchat + participant Route as main route dispatcher + participant P as Presenter / Service + + UI->>Client: method(input) + Client->>Bridge: invoke(route.name, input) + Bridge->>Route: 
validated route envelope + Route->>P: call presenter/service method + P-->>Route: result + Route-->>Bridge: validated output + Bridge-->>Client: typed result + Client-->>UI: domain-shaped result +``` + +与 EventBus 的区别: + +| 特性 | EventBus / typed events | Typed route | +|------|----------|-------------| | 模式 | pub/sub(发布/订阅) | request/response(请求/响应) | | 方向 | 主要主→渲染(广播) | 渲染→主(调用) | | 返回值 | 无返回值 | Promise | | 典型用途 | 状态通知、流式更新、UI 同步 | CRUD 操作、命令执行、数据查询 | -| 监听方式 | renderer 监听事件 | renderer 调用方法 | -| 通信通道 | `sendToRenderer()` / `on()` | `invoke('presenter:call')` | - -### 调试支持 - -通过环境变量 `VITE_LOG_IPC_CALL=1` 可以开启 IPC 调用日志: - -```bash -VITE_LOG_IPC_CALL=1 npm run dev -``` +| 监听方式 | `window.deepchat.on()` 或 client 封装 | client 方法调用 | +| 通信通道 | typed event envelope | typed route envelope | -控制台输出: -``` -[Renderer IPC] WebContents:42 -> agent.sendMessage -``` +调试 renderer-main 调用时,优先看 `src/shared/contracts/routes*.ts`、`src/renderer/api/*Client.ts` +和 `src/main/routes/*`;不要从已退休 legacy presenter transport 反推。 ## 🔍 在渲染进程监听事件 ### Vue 组件中监听事件 ```typescript -import { eventBus } from '@preload' +import { chatStreamCompletedEvent, chatStreamUpdatedEvent } from '@shared/contracts/events' export default { setup() { + let stopChunk: (() => void) | null = null + let stopEnd: (() => void) | null = null + onMounted(() => { // 监听流响应 - window.api.on(STREAM_EVENTS.RESPONSE, (data) => { + stopChunk = window.deepchat.on(chatStreamUpdatedEvent.name, (data) => { console.log('收到流响应:', data) - // 更新 UI }) // 监听流结束 - window.api.on(STREAM_EVENTS.END, (data) => { + stopEnd = window.deepchat.on(chatStreamCompletedEvent.name, (data) => { console.log('流结束:', data) }) }) onUnmounted(() => { // 清理监听器 - window.api.removeAllListeners(STREAM_EVENTS.RESPONSE) - window.api.removeAllListeners(STREAM_EVENTS.END) + stopChunk?.() + stopEnd?.() }) } } @@ -814,20 +730,27 @@ export default { ```typescript import { defineStore } from 'pinia' -import { eventBus } from '@preload' +import { chatStreamUpdatedEvent } from 
'@shared/contracts/events' export const useChatStore = defineStore('chat', { state: () => ({ - messages: [] + messages: [], + stopStreamListener: null as null | (() => void) }), actions: { initEventListener() { - window.api.on(STREAM_EVENTS.RESPONSE, (data) => { + this.stopStreamListener?.() + this.stopStreamListener = window.deepchat.on(chatStreamUpdatedEvent.name, (data) => { this.handleStreamResponse(data) }) }, + disposeEventListener() { + this.stopStreamListener?.() + this.stopStreamListener = null + }, + handleStreamResponse(data) { // 处理流响应 const { content, tool_call, eventId } = data @@ -842,7 +765,8 @@ export const useChatStore = defineStore('chat', { - **EventBus**: `src/main/eventbus.ts:1-152` - **事件常量**: `src/main/events.ts:1-263` - **Presenter 初始化**: `src/main/presenter/index.ts` -- **useLegacyPresenter**: `src/renderer/api/legacy/presenters.ts` +- **Typed route/event contracts**: `src/shared/contracts/routes.ts`, `src/shared/contracts/events.ts` +- **Renderer clients**: `src/renderer/api/` ## 📚 相关阅读 diff --git a/docs/architecture/presenter-ipc-migration-plan/audit.md b/docs/architecture/presenter-ipc-migration-plan/audit.md new file mode 100644 index 000000000..f371d388b --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/audit.md @@ -0,0 +1,126 @@ +# Presenter IPC Migration Completion - Audit + +Audit snapshot: 2026-06-10. + +Execution snapshot: 2026-06-11. + +- Renderer settings business surfaces have been migrated off `@api/legacy/presenters` and direct + `window.electron.ipcRenderer` for the audited slices. +- Completed typed domains now include Knowledge, Skill Sync, OAuth, NowledgeMem, database repair, + browser sandbox clear, MCP Router, Remote Control, settings/window notifications, ACP settings + reload, Skills catalog reload, ACP terminal command/events, Shortcut runtime, chat stream + terminal events, context menu events, app runtime events, and secondary renderer preload + hardening. 
+- Current source scan still shows raw IPC in startup/specialized preload boundaries only: + `src/preload/index.ts`, `src/preload/plugin-settings-preload.ts`, + `src/preload/splash-preload.ts`, `src/preload/floating-preload.ts`, + `src/preload/browser-overlay-preload.ts`, and `src/preload/createBridge.ts`. +- `presenter:call`, `remoteControlPresenter:call`, `Presenter.DISPATCHABLE_PRESENTERS`, + `Presenter.REMOTE_CONTROL_METHODS`, and `src/renderer/api/legacy/**` have been removed from + source. + +## Commands Used + +```bash +rg "useLegacyPresenter|window\\.electron|window\\.api" src/renderer src/preload +rg "ipcMain\\.|ipcRenderer\\.|webContents\\.send|sendSync" src/main src/preload src/renderer +rg "eventBus\\.send|eventBus\\.sendToRenderer|eventBus\\.on" src/main +node scripts/architecture-guard.mjs +``` + +`node scripts/architecture-guard.mjs` passed after the guard was expanded to settings and after +`src/renderer/api/legacy/**` was retired. + +## Existing Typed Boundary + +The shared contract catalog currently contains broad coverage: + +| Contract area | Current coverage | +| --- | --- | +| Routes | 271 typed routes across browser, chat, config, database security, device, dialog, file, MCP, models, onboarding, plugins, project, providers, scheduled tasks, sessions, settings, skills, startup, sync, system, tab, tools, upgrade, window, workspace | +| Events | 54 typed events across browser, chat, config, dialog, MCP, models, providers, sessions, settings, skills, startup, sync, upgrade, window, workspace | +| Bridge | `src/preload/createBridge.ts` validates route input/output and typed event envelopes | +| Main dispatcher | `src/main/routes/index.ts` owns `deepchat:route:invoke` | +| Renderer clients | `src/renderer/api/*Client.ts` covers the main chat/session/provider/model/MCP/settings path | + +## Generic Presenter Dispatchers Retired + +`src/main/presenter/index.ts` no longer registers: + +| IPC handler | Current role | Risk | +| --- | --- | --- | +| 
`presenter:call` | Removed | Generic method reflection is no longer renderer-callable | +| `remoteControlPresenter:call` | Removed | Remote control now uses typed `remoteControl.*` routes | + +The generic dispatcher allowlists `Presenter.DISPATCHABLE_PRESENTERS` and +`Presenter.REMOTE_CONTROL_METHODS` have also been removed. + +## Initial Legacy Presenter Call Inventory + +The following table records the 2026-06-10 audit baseline before the execution work in this branch. +It is intentionally kept as a migration source map, not as the current remaining source scan. + +Initial named `useLegacyPresenter('...')` hits: + +| Presenter | Count | Main callers and methods | +| --- | ---: | --- | +| `configPresenter` | 12 | ACP registry/manual agent management, DeepChat agent CRUD, hooks notifications, skill draft suggestions, update channel, proxy settings, logging folder, provider DB refresh, generic get/set setting | +| `windowPresenter` | 5 | settings window close/provider-install state, main-window focus for onboarding, update check broadcast, guided onboarding helper injection | +| `llmproviderPresenter` | 5 | key status, refresh models, embedding dimensions, ModelScope MCP sync, provider rate limit update/status, ACP debug action | +| `devicePresenter` | 5 | app/device info, select directory/files, data reset | +| `skillSyncPresenter` | 4 | scan, discovery acknowledgement, import/export preview and execution | +| `projectPresenter` | 3 | recent projects, select directory, path exists | +| `knowledgePresenter` | 3 | knowledge file CRUD, query, validation, supported languages/separators | +| `agentSessionPresenter` | 2 | agents list, usage dashboard, RTK health retry | +| `oauthPresenter` | 1 | GitHub Copilot OAuth/device flow | +| `mcpPresenter` | 1 | MCP Router market/API key/install helpers | +| `toolPresenter` | 1 | tool definitions for agent settings | +| `skillPresenter` | 1 | read skill file | +| `filePresenter` | 1 | prompt editor file preparation | +| 
`sqlitePresenter` | 1 | repair schema | +| `yoBrowserPresenter` | 1 | clear browser sandbox data | +| `exporter` | 1 | NowledgeMem config/test/update | +| `shortcutPresenter` | 1 | renderer shortcut runtime helper | + +There were also wrapper-level usages: + +| Wrapper | File | Current role | +| --- | --- | --- | +| `RemoteControlRuntime` | `src/renderer/api/RemoteControlRuntime.ts` | Wraps `useLegacyRemoteControlPresenter()` | +| `ShortcutRuntime` | `src/renderer/api/ShortcutRuntime.ts` | Wraps `useLegacyShortcutPresenter()` | +| `src/renderer/api/legacy/**` | quarantine | Contains the generic legacy transport and runtime wrappers | + +## Initial Direct Raw IPC And Window Runtime Inventory + +The following inventory is also the pre-execution baseline. The 2026-06-11 execution snapshot above +is the authoritative current state for remaining raw IPC exceptions. + +| Area | Files | Channels or APIs | +| --- | --- | --- | +| Chat stream compatibility | `src/renderer/src/stores/ui/messageIpc.ts` | listens to legacy `STREAM_EVENTS.END` and `STREAM_EVENTS.ERROR` even though `chat.stream.completed/failed` exists | +| Context menu bridge | `src/renderer/src/components/message/SelectedTextContextMenu.vue`, `src/main/contextMenuHelper.ts` | raw `context-menu-translate`, `context-menu-ask-ai` | +| Settings shell | `src/renderer/settings/App.vue` | `SETTINGS_EVENTS.NAVIGATE`, `SETTINGS_EVENTS.PROVIDER_INSTALL`, `SETTINGS_EVENTS.READY`, notification events | +| ACP settings/debug/terminal | `AcpSettings.vue`, `AcpDebugDialog.vue`, `AcpTerminalDialog.vue` | `CONFIG_EVENTS.AGENTS_CHANGED`, `ACP_DEBUG_EVENTS.EVENT`, `acp-init:*`, `external-deps-required`, `acp-terminal:*` | +| Knowledge base | `KnowledgeFile.vue`, `KnowledgeFileItem.vue` | `RAG_EVENTS.FILE_UPDATED`, `RAG_EVENTS.FILE_PROGRESS` | +| Provider rate limit | `ProviderRateLimitConfig.vue` | `RATE_LIMIT_EVENTS.CONFIG_UPDATED`, `REQUEST_EXECUTED`, `REQUEST_QUEUED` | +| Skill sync/catalog | `SyncPromptDialog.vue`, 
`SkillsSettings.vue` | `SKILL_SYNC_EVENTS.NEW_DISCOVERIES`, `skill:installed`, `skill:uninstalled`, `skill:metadata-updated` | +| Direct `window.api` | settings components | copy text, read clipboard, open external, file path extraction | +| Splash renderer | `src/renderer/splash/loading.vue` | database unlock submit/cancel/progress/request through raw Electron API | + +## Secondary Renderer And Preload Inventory + +| Renderer | Boundary today | Recommendation | +| --- | --- | --- | +| Main renderer | `window.deepchat` plus narrow `window.api` runtime helpers | Keep `window.api` behind `src/renderer/api/runtime.ts`; no component-level raw IPC | +| Settings renderer | same preload as main renderer | Migrated to `renderer/api/*Client`; no component-level legacy IPC | +| Plugin settings renderer | `deepchatPlugin` backed by `createBridge(ipcRenderer)` | Keep specialized API, already typed-route backed | +| Browser overlay | `yoBrowserOverlay.onActivityChanged` using typed event name and schema validation | Keep specialized API unless moved to `createBridge` later | +| Floating widget | `floatingButtonAPI` with shared custom channels and payload validation | Keep specialized API; listeners return scoped unsubscribe functions | +| Splash | `window.deepchatSplash` dedicated startup API | Keep raw IPC inside preload only because unlock can run before route runtime | + +## Guard Gap + +`scripts/architecture-guard.mjs` now scans `src/renderer/src` and `src/renderer/settings`, forbids +business-layer imports from `@api/legacy/**`, and treats a recreated `src/renderer/api/legacy/**` +directory as a regression. Remaining work is to regenerate the architecture baseline reports and add +a dedicated fixture/test proving settings-level legacy imports fail the guard. 
diff --git a/docs/architecture/presenter-ipc-migration-plan/change-map.zh-CN.md b/docs/architecture/presenter-ipc-migration-plan/change-map.zh-CN.md new file mode 100644 index 000000000..70a906af8 --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/change-map.zh-CN.md @@ -0,0 +1,867 @@ +# Presenter IPC 迁移改造清单 + +更新时间:2026-06-12 +当前分支:`codex/presenter-ipc-migration-plan` + +## 结论 + +这次真正要改的不是把所有 presenter 本体推倒重写,而是把 renderer 到 main 的 IPC 边界收口。 + +目标结构是: + +```text +settings / renderer 组件 + -> src/renderer/api/*Client.ts + -> window.deepchat.invoke/on + -> src/shared/contracts/routes + events + -> src/main/routes/* + -> 现有 presenter 方法 +``` + +也就是说,presenter 仍然是 main 侧业务 owner;要去掉的是 renderer 直接知道 +`knowledgePresenter`、`skillSyncPresenter`、`remoteControlPresenter:call`、`window.electron.ipcRenderer` +这些 legacy IPC 细节。 + +## 当前状态和剩余 Legacy 面 + +以 2026-06-11 当前工作区扫描为准,settings 业务组件已经不再直接调用 +`useLegacyPresenter(...)`、`useLegacyRemoteControlPresenter(...)`、 +`useLegacyShortcutPresenter(...)`,也不再直接订阅 settings/notification/ACP/knowledge/skill-sync +等旧 IPC 事件。 + +当前仍保留的 raw IPC 只在这些 preload/bridge 边界: + +| 类型 | 文件 | 保留原因 | +| --- | --- | --- | +| typed bridge 内部实现 | `src/preload/createBridge.ts` | 这是 `window.deepchat.invoke/on` 的底层桥,不属于业务 legacy 调用。 | +| preload runtime id | `src/preload/index.ts` | 仍用 `sendSync('get-window-id')` / `sendSync('get-web-contents-id')` 暴露窗口上下文,后续应并入窄 preload runtime API。 | +| plugin settings 专用 preload | `src/preload/plugin-settings-preload.ts` | 用 `createBridge(ipcRenderer)` 包成 `window.deepchatPlugin`,仍是 typed route backed。 | +| 启动/解锁窗口 preload | `src/preload/splash-preload.ts` | splash 可能早于完整 presenter route runtime 启动;renderer 只使用 `window.deepchatSplash`;preload 边界已通过单测覆盖,真实加密库解锁仍需隔离 profile 验证。 | +| 悬浮窗专用 preload | `src/preload/floating-preload.ts` | 使用 shared channel 常量、payload 校验和 scoped unsubscribe。 | +| browser overlay preload | `src/preload/browser-overlay-preload.ts` | 专用 overlay API,已用 shared event schema 校验 activity 
payload。 | + +初始审计中发现的 settings 侧缺口,目前状态如下: + +| 初始 legacy 域 | 当前状态 | +| --- | --- | +| `knowledgePresenter` | 已迁移到 `knowledge.*` routes、`knowledge.file.*` typed events、`KnowledgeClient`。 | +| `skillSyncPresenter` | 已迁移到 `skillSync.*` routes/events、`SkillSyncClient`。 | +| `remoteControlPresenter:call` | `RemoteSettings` 已迁移到 `remoteControl.*` routes、`RemoteControlClient`;main 兼容 handler 已删除。 | +| `agentSessionPresenter` | Dashboard/Remote agent list 已迁移到 `SessionClient` typed routes。 | +| MCP Router | 已迁移到 `mcp.router.*` routes 和 `McpClient`。 | +| GitHub Copilot OAuth | 已迁移到 `oauth.githubCopilot.*` routes 和 `OAuthClient`。 | +| NowledgeMem/exporter | 已迁移到 `nowledgeMem.*` routes 和 `NowledgeMemClient`。 | +| `sqlitePresenter.repairSchema` | 已迁移到 `databaseSecurity.repairSchema` route。 | +| `yoBrowserPresenter.clearSandboxData` | 已迁移到 `browser.clearSandboxData` route。 | +| `skillPresenter.readSkillFile` | 已迁移到 `skills.readFile` route。 | +| Settings/notification/ACP terminal 旧事件 | 已迁移到 `WindowClient`、`AcpTerminalClient` 和 typed events。 | + +自动化迁移 gate 已经收口;剩余不是代码路径,而是需要真实外部服务/本机状态的人工验证记录, +例如 GitHub Copilot OAuth、Remote Control 真实账号绑定、MCP Router 安装、NowledgeMem live +connection、真实 profile 数据库修复、browser sandbox reset、使用隔离加密 profile 的 splash +数据库解锁。 + +## 分层改造 + +### 1. 
Shared contracts + +要在 `src/shared/contracts/routes/*.routes.ts` 和 `src/shared/contracts/events/*.events.ts` +为每个剩余域补 route/event contract。每个 route 必须定义: + +- `name` +- `input` schema +- `output` schema +- renderer 看到的 domain 名,而不是 presenter 名 + +例子: + +| 旧 presenter 方法 | 新 route | +| --- | --- | +| `knowledgePresenter.listFiles(id)` | `knowledge.listFiles` | +| `skillSyncPresenter.previewImport(...)` | `skillSync.previewImport` | +| `remoteControlPresenter.createTelegramPairCode()` | `remoteControl.createPairCode` | +| `sqlitePresenter.repairSchema()` | `database.repairSchema` | + +事件也一样,renderer 不再听旧通道,而是听 typed event: + +| 旧事件 | 新事件 | +| --- | --- | +| `RAG_EVENTS.FILE_UPDATED` | `knowledge.file.updated` | +| `RAG_EVENTS.FILE_PROGRESS` | `knowledge.file.progress` | +| `SKILL_SYNC_EVENTS.NEW_DISCOVERIES` | `skillSync.discoveries.changed` | +| `NOTIFICATION_EVENTS.SHOW_ERROR` | `notifications.errorShown` 或 settings notification domain | + +### 2. Main routes + +要在 `src/main/routes/index.ts` 或更细的 route handler 中把新 route 接到现有 presenter。 + +关键点: + +- main route runtime 需要注入对应 presenter,例如 `knowledgePresenter`、`skillSyncPresenter`、 + `remoteControlPresenter`。 +- route handler 只做输入校验、调用 presenter、输出校验,不把 UI 状态塞进去。 +- 涉及当前窗口的 route,例如 settings ready、close、provider install consume,必须使用 + invoking `webContentsId`,不能用“当前 focused window”猜。 + +### 3. Event bridge + +main 内部可以继续用 `EventBus`,但 renderer-visible 事件要统一通过 typed event 发布。 + +要改 `src/main/routes/legacyTypedEventBridge.ts`: + +- 把 `RAG_EVENTS.FILE_UPDATED/FILE_PROGRESS` 映射到 `knowledge.file.updated/progress`。 +- 把 `SKILL_SYNC_EVENTS.NEW_DISCOVERIES` 映射到 `skillSync.discoveries.changed`。 +- 把 notification/settings/ACP terminal 等旧事件逐步映射到 typed events 或专用 client API。 + +注意:bridge 是过渡层。最终如果 presenter 直接 publish typed event,bridge 可以删除。 + +### 4. 
Renderer API clients + +每个域补一个或扩展一个 client,文件放在 `src/renderer/api`。 + +| 域 | Client | +| --- | --- | +| Knowledge | 新增 `KnowledgeClient.ts` | +| Skill sync | 新增 `SkillSyncClient.ts` | +| Remote control | 新增 `RemoteControlClient.ts`,替代 `RemoteControlRuntime.ts` | +| Agent session dashboard | 扩展 `SessionClient.ts` 或新建 dashboard client | +| MCP Router | 扩展 `McpClient.ts` | +| GitHub Copilot OAuth | 新增 `OAuthClient.ts` 或放到 Provider auth client | +| NowledgeMem | 新增 `NowledgeMemClient.ts` 或归到 exporter/export client | +| Database repair | 扩展 `DatabaseSecurityClient.ts` 或新增 database ops route | +| Browser sandbox | 扩展 `BrowserClient.ts` | +| Skill file read | 扩展 `SkillClient.ts` | + +Client 负责把 route 的 envelope 还原成组件需要的老返回形态。这样组件改动最小。 + +### 5. Renderer 组件 + +组件里要做的事很机械: + +- 删除 `useLegacyPresenter(...)`。 +- 删除 `window.electron.ipcRenderer.on/send/removeAllListeners`。 +- 改用 `createXxxClient()`。 +- 事件订阅统一保存 unsubscribe,在 `onBeforeUnmount/onUnmounted` 调用。 +- 不再 `removeAllListeners(oldChannel)`,因为那会误删同通道其他监听者。 + +### 6. 
Guard + +`scripts/architecture-guard.mjs` 现在已经能拦 settings legacy IPC,并且已有测试证明: + +- settings 重新引入 `@api/legacy/presenters` / `useLegacyPresenter` 会失败。 +- settings 重新直接监听 `window.electron.ipcRenderer.on(...)` 会失败。 +- `src/renderer/api/legacy/**` 被视为已退休路径,重新出现会失败。 +- baseline 已重新生成,业务层 legacy 计数为 `0`,剩余例外限定在 preload/bridge 边界。 + +## Presenter-by-Presenter 改造 + +### `knowledgePresenter` + +旧入口: + +- `KnowledgeBaseSettings.vue`: `isSupported` +- `BuiltinKnowledgeSettings.vue`: `getSupportedLanguages`, `getSeparatorsForLanguage` +- `KnowledgeFile.vue`: `getSupportedFileExtensions`, `validateFile`, `addFile`, `deleteFile`, + `reAddFile`, `listFiles`, `similarityQuery`, `pauseAllRunningTasks`, `resumeAllPausedTasks` +- `KnowledgeFile.vue`, `KnowledgeFileItem.vue`: `RAG_EVENTS.FILE_UPDATED/FILE_PROGRESS` + +要改: + +- 新增 `src/shared/contracts/routes/knowledge.routes.ts`。 +- 新增 `src/shared/contracts/events/knowledge.events.ts`。 +- 新增 `src/renderer/api/KnowledgeClient.ts`。 +- `src/main/routes/index.ts` 注入 `knowledgePresenter` 并 dispatch `knowledge.*`。 +- `legacyTypedEventBridge.ts` 把 RAG 事件映射到 typed event。 +- 四个知识库组件改用 `KnowledgeClient`。 + +测试: + +- `test/main/routes/contracts.test.ts`: route/event catalog 包含 `knowledge.*`。 +- `test/main/routes/dispatcher.test.ts`: mock `knowledgePresenter`,验证每个 route 调到正确方法。 +- `test/renderer/api/clients.test.ts`: `KnowledgeClient` 输入输出和事件 unsubscribe。 +- 组件测试:`BuiltinKnowledgeSettings`, `KnowledgeBaseSettings`, `KnowledgeFile`, + `KnowledgeFileItem`。 + +副作用: + +- `addFile/reAddFile` 会触发 embedding、向量库写入和进度事件。 +- `similarityQuery` 会返回已索引内容片段,不能扩大调用面。 +- 文件选择和真实文件 path 在单测里很难完全模拟。 + +人工验证: + +- 新建一个内置知识库配置。 +- 添加一个支持文件,确认列表出现并有进度。 +- 暂停/恢复处理。 +- re-add 文件。 +- 删除文件。 +- 执行一次相似度搜索。 +- 上传不支持的文件,确认错误提示仍然正确。 + +### `skillSyncPresenter` + +旧入口: + +- `SyncPromptDialog.vue`: `getNewDiscoveries`, `acknowledgeDiscoveries`, `SKILL_SYNC_EVENTS.NEW_DISCOVERIES` +- `SyncStatusSection.vue`: `scanExternalTools` +- `ImportWizard.vue`: `scanExternalTools`, 
`previewImport`, `executeImport` +- `ExportWizard.vue`: `getRegisteredTools`, `previewExport`, `executeExport` + +要改: + +- 新增 `skillSync.*` routes。 +- 新增 `SkillSyncClient.ts`。 +- 新增 typed events:`skillSync.discoveries.changed`,必要时补 scan/import/export progress。 +- 组件全部改用 `SkillSyncClient`。 + +测试: + +- route contract 测 tool id、skill name、conflict strategy、export options。 +- handler 测 scanner/converter 被正确调用。 +- renderer client 测 preview/execute 的输入输出。 +- 组件测发现提示、扫描、导入预览、导出预览、冲突策略。 + +副作用: + +- import/export 会读写外部工具目录。 +- conflict strategy 一旦传错会覆盖或复制技能文件。 +- 外部工具扫描依赖用户机器环境,CI 只能 mock。 + +人工验证: + +- 扫描本机已安装工具。 +- 导入一个技能,分别验证 skip/overwrite/rename 等冲突策略。 +- 导出一个技能到一个临时外部工具目录。 +- 验证“不再提示新发现”仍然生效。 + +### `remoteControlPresenter` + +旧入口: + +- `RemoteSettings.vue`: `useLegacyRemoteControlPresenter({ safeCall: false })` +- Telegram/Weixin 兼容方法:settings/status/bindings/pair code/login/restart/remove + +要改: + +- 新增 `remoteControl.*` routes 和 `RemoteControlClient.ts`。 +- 优先用通用 channel route: + - `remoteControl.listChannels` + - `remoteControl.getSettings` + - `remoteControl.saveSettings` + - `remoteControl.getStatus` + - `remoteControl.listBindings` + - `remoteControl.removeBinding` + - `remoteControl.removePrincipal` + - `remoteControl.getPairingSnapshot` + - `remoteControl.createPairCode` + - `remoteControl.clearPairCode` +- Weixin iLink 保留窄 route: + - `remoteControl.weixinIlink.startLogin` + - `remoteControl.weixinIlink.waitLogin` + - `remoteControl.weixinIlink.removeAccount` + - `remoteControl.weixinIlink.restartAccount` +- `RemoteSettings.vue` 不再依赖 `RemoteControlRuntime.ts`。 +- 最后删除 `remoteControlPresenter:call` handler 和 allowlist。 + +测试: + +- route schema 测 channel enum 和 settings discriminated union。 +- handler 测不同 channel 的 presenter 方法映射。 +- `RemoteSettings.vue` 组件测保存、状态刷新、配对码、binding 删除。 + +副作用: + +- 远控配置可能包含 token、secret、账号绑定,route output 必须脱敏。 +- Weixin 登录是长任务,自动化只能 mock;真实等待流程需要人工测。 + +人工验证: + +- Telegram 保存 token,生成/清除 pair code,删除 binding。 +- 
Feishu/QQBot/Discord 保存配置并刷新状态。 +- Weixin iLink 启动登录、等待成功或失败、重启账号、移除账号。 + +### `agentSessionPresenter` + +旧入口: + +- `DashboardSettings.vue`: `getUsageDashboard`, `retryRtkHealthCheck` +- `RemoteSettings.vue`: `getAgents` + +要改: + +- `getAgents` 优先复用已有 `SessionClient.getAgents` 或 `ConfigClient.listAgents`。 +- 新增: + - `sessions.usageDashboard.get` + - `sessions.rtkHealth.retry` +- `DashboardSettings.vue` 和 `RemoteSettings.vue` 改用 typed client。 + +测试: + +- route handler 测 dashboard 聚合和 retry 调用。 +- 组件测试 dashboard loading/error/empty、有数据、RTK retry。 +- Remote settings 测 agent 列表加载。 + +副作用: + +- dashboard 可能扫描大量会话,route 要保留现有性能和错误兜底。 +- RTK retry 会触发后台检查,必须仍然是用户显式点击。 + +人工验证: + +- 打开有历史会话的 dashboard。 +- 点击 RTK retry,确认状态和错误信息刷新。 +- Remote settings 的 agent 下拉仍能加载。 + +### `mcpPresenter` 的 MCP Router 部分 + +旧入口: + +- `McpBuiltinMarket.vue`: `getMcpRouterApiKey`, `setMcpRouterApiKey`, + `updateMcpRouterServersAuth`, `isServerInstalled`, `listMcpRouterServers`, + `installMcpRouterServer` + +要改: + +- 扩展 `McpClient.ts`,新增 `mcp.router.*` routes。 +- API key 存储和 server install 仍在 main。 +- 安装后继续复用 MCP 配置刷新/服务器状态事件。 + +测试: + +- route contract 测 page/limit/apiKey/serverKey。 +- handler mock 网络和安装流程。 +- `McpBuiltinMarket.vue` 组件测保存 key、分页、安装按钮状态。 + +副作用: + +- 会访问 MCP Router 网络接口。 +- 保存 API key 会写配置。 +- 安装 server 会改 MCP server 配置,可能启动进程。 + +人工验证: + +- 保存 MCP Router API key。 +- 拉取市场列表。 +- 安装一个 server,确认 MCP 设置里出现。 + +### `oauthPresenter` + +旧入口: + +- `GitHubCopilotOAuth.vue`: `startGitHubCopilotLogin`, `startGitHubCopilotDeviceFlowLogin` + +要改: + +- 新增 `oauth.githubCopilot.startLogin` 和 `oauth.githubCopilot.startDeviceFlowLogin`, + 或放到 provider auth domain。 +- 新增 `OAuthClient.ts` 或 `ProviderAuthClient.ts`。 +- 组件只关心 boolean/result,不直接碰 presenter。 + +测试: + +- handler mock OAuth presenter,验证 providerId 传递。 +- 组件测登录成功/失败和 loading 状态。 + +副作用: + +- 会打开浏览器/device flow,写入 provider credential。 +- CI 只能 mock shell/deeplink。 + +人工验证: + +- 用 disposable provider/account 跑一次 device flow。 +- 如果传统 OAuth 
仍保留,也跑一次传统登录。 + +### `exporter` / NowledgeMem + +旧入口: + +- `NowledgeMemSettings.vue`: `getNowledgeMemConfig`, `updateNowledgeMemConfig`, + `testNowledgeMemConnection` + +要改: + +- 新增 `nowledgeMem.getConfig/updateConfig/testConnection` routes。 +- 新增 `NowledgeMemClient.ts`,或放到 export/domain client。 +- config schema 要限制 URL、timeout 范围,同时保留现有默认值。 + +测试: + +- route schema 测 timeout bounds 和 URL 字段。 +- handler mock exporter。 +- 组件测保存、重置、测试连接成功/失败。 + +副作用: + +- test connection 会发网络请求。 +- API key 不能泄露到日志或错误详情。 + +人工验证: + +- 配一个本地或 disposable endpoint。 +- 验证测试成功、测试失败、保存后刷新仍保留。 + +### `sqlitePresenter` + +旧入口: + +- `DataSettings.vue`: `repairSchema` + +要改: + +- 新增 `database.repairSchema` 或 `databaseSecurity.repairSchema` route。 +- 推荐放在 database ops domain,不和 encryption route 混太深。 +- `DataSettings.vue` 改用 typed client。 + +测试: + +- handler mock repair report。 +- 组件测 repair loading、成功报告、错误状态。 + +副作用: + +- 会修改本地数据库 schema。 +- 不能在真实主 profile 上随便人工验证。 + +人工验证: + +- 复制一个测试 profile。 +- 在副本上触发 repair。 +- 检查报告 UI 和数据库仍能正常打开。 + +### `yoBrowserPresenter` + +旧入口: + +- `DataSettings.vue`: `clearSandboxData` + +要改: + +- 扩展 `BrowserClient.ts`,新增 `browser.clearSandboxData`。 +- `DataSettings.vue` 改用 `BrowserClient`。 + +测试: + +- browser route handler mock。 +- 组件测清理确认、loading、错误 toast。 + +副作用: + +- 会清浏览器 sandbox/cache。 + +人工验证: + +- 打开 browser 产生 sandbox 数据。 +- 清理。 +- 再打开确认是干净状态。 + +### `skillPresenter` + +旧入口: + +- `SkillEditorSheet.vue`: `readSkillFile` + +要改: + +- 扩展 `SkillClient.ts`,新增 `skills.readFile`。 +- renderer 只能传 skill name/id,路径解析留在 main。 + +测试: + +- schema 拒绝空名和路径穿越形态。 +- Skill editor 组件测加载内容。 + +副作用: + +- 文件读取不能扩大到任意路径。 + +人工验证: + +- 打开一个已安装 skill。 +- 编辑保存。 +- 关闭再打开确认内容仍正确。 + +### Settings shell / notification / ACP terminal 原始事件 + +旧入口: + +- `settings/App.vue`: settings navigation、provider install、ready、notification。 +- `AboutUsSettings.vue`: update check event。 +- `AcpTerminalDialog.vue`: `acp-init:*`, `external-deps-required`, `acp-terminal:*`。 + +已改: + +- Settings shell 通过 
`WindowClient` typed route/event: + - `settings.navigateRequested` + - `settings.providerInstallRequested` + - `settings.checkForUpdatesRequested` + - `window.notifySettingsReady` + - `notification.error` + - `databaseSecurity.repairSuggested` +- About 更新检查订阅 `WindowClient.onSettingsCheckForUpdates()`。 +- `AcpSettings.vue` 的 agent reload 订阅 `ConfigClient.onAgentsChanged()`。 +- `SkillsSettings.vue` 的 skill catalog reload 订阅 `SkillClient.onCatalogChanged()`。 +- ACP terminal 新增专用 `AcpTerminalClient`: + - `acpTerminal.input` + - `acpTerminal.kill` + - `acpTerminal.started/output/exited/error` + - `acpTerminal.externalDependenciesRequired` + +测试: + +- settings app 事件订阅测试已更新。 +- About update check 组件测试已更新。 +- ACP terminal route/client 已由 contracts、dispatcher、client 测试覆盖。 +- 证据: + - `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/SettingsApp.test.ts test/renderer/components/SettingsApp.providerDeeplink.test.ts test/renderer/components/AboutUsSettings.test.ts` + - `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/AcpSettings.test.ts` + +副作用: + +- settings provider deeplink 可能发生在 settings window 打开之前,需要保留 pending 消费语义。 +- ACP terminal 是长连接/子进程输出流,事件 payload 要小且稳定。 + +人工验证: + +- provider deeplink 打开 settings 并进入安装预览。 +- settings 内跳转目标 section 正常。 +- About 页外部触发 check update 正常。 +- ACP terminal 初始化、输出、输入、kill、依赖缺失提示正常。 + +### 当前仍保留的 raw IPC 例外 + +保留项: + +- `src/preload/createBridge.ts` +- `src/preload/index.ts` +- `src/preload/plugin-settings-preload.ts` +- `src/preload/splash-preload.ts` +- `src/preload/floating-preload.ts` +- `src/preload/browser-overlay-preload.ts` + +为什么保留: + +- splash 是启动期窗口,数据库解锁可能发生在 presenter route runtime 可用之前。 +- floating/browser overlay/plugin settings 是专用 preload API,不是业务组件直接调用 presenter。 +- `createBridge` 是 typed route/event 的底层实现。 +- 
`src/preload/index.ts` 仍提供窄 `window.api` runtime helper 和同步窗口 ID 获取。 + +本轮已完成: + +- splash 建立 `window.deepchatSplash` 专用 API,renderer 不再暴露通用 `window.electron`。 +- floating/browser overlay 完成 channel 常量共享和 payload validation。 +- 删除 `remoteControlPresenter:call`、generic `presenter:call` 和 + `src/renderer/api/legacy/**`。 + +## Legacy Transport 删除后的最终验证条件 + +删除已完成;当前验证状态如下。 + +已通过: + +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` +- `pnpm run typecheck` +- `pnpm run build` +- 全量 `pnpm test -- --silent --reporter=dot`:376 个文件通过,6 个跳过;3175 个测试通过, + 41 个跳过。 +- 聚焦迁移测试:13 个文件 / 130 个测试通过。 +- Electron smoke e2e:启动应用、settings control center navigation 两个用例通过。 +- Electron settings IPC boundary e2e:真实 settings 窗口确认 `window.deepchat.invoke/on` 存在、 + broad `window.electron` / `api.ipcRenderer` 不暴露,`presenter:call` 被拒绝,并打开 + knowledge、skills、remote、MCP、data 五个迁移后的设置页。 +- Electron main renderer IPC boundary e2e:真实主聊天窗口确认 `window.deepchat.invoke/on` 存在, + 可调用 typed `device.getAppVersion` route,broad `window.electron` / `api.ipcRenderer` 不暴露, + `presenter:call` 被拒绝。 +- Electron Data Settings privacy mode e2e:真实 Data Settings 页面点击 Privacy Mode 开关, + 验证 `settings.getSnapshot/settings.update` typed route 状态变化,并在用例结束前恢复原始 + `privacyModeEnabled` 值。 +- Electron Remote Control read-only route e2e:真实 Remote Settings 页面切换 Telegram、Feishu、 + QQBot、Discord、Weixin iLink 五个 channel tab,并对每个 channel 读取 + `remoteControl.listChannels/getChannelSettings/getChannelStatus/getChannelBindings`,不需要真实远控账号, + 也不修改远控配置。 +- RemoteControl runtime 收口:`WindowSideBar` 已直接使用 `RemoteControlClient` 读取主窗口远控状态, + `src/renderer/api/RemoteControlRuntime.ts` 已删除。聚焦验证中,`WindowSideBar`/`RemoteSettings`/ + route/client 相关单测 5 个文件 126 个测试通过;真实主窗口 e2e 现在额外读取 + `remoteControl.listChannels/getChannelStatus`,并和 Remote Settings 只读 e2e 一起串行通过。 +- Upgrade raw update 事件收口:`upgradePresenter` 不再向 renderer 发送旧的 + `update:status-changed`、`update:error`、`update:progress`、`update:will-restart` raw channel; + renderer 只通过 
`UpgradeClient` 接收 typed `upgrade.status.changed`、`upgrade.progress`、 + `upgrade.willRestart`、`upgrade.error` 事件。`UPDATE_EVENTS` 现在只剩 main 内部 + `update:state-changed`,用于 upgrade/lifecycle 之间的更新中状态同步。聚焦单测 4 个文件 64 个测试通过, + 旧 raw update 事件名源码扫描无命中。 +- Dialog raw 事件收口:`DialogPresenter.showDialog` 不再发送旧的 `dialog:request` raw channel; + renderer dialog store 只通过 typed `dialog.requested` 打开全局对话框,并继续通过 + `dialog.respond/dialog.error` typed routes 回传结果。聚焦验证中,presenter、route、client、store + 相关 5 个文件 82 个测试通过;`dialog:request/dialog:response` 源码扫描无命中。 +- Workspace invalidation 收口:`WorkspacePresenter` watcher 不再发送旧的 + `workspace:files-changed` raw channel,只发送 typed `workspace.invalidated`。聚焦验证中, + workspace presenter watcher、route、client 相关 4 个文件 94 个测试通过; + `workspace:files-changed` 源码扫描无命中。真实主窗口 e2e 通过 `workspace.register` 读取当前仓库的 + `workspace.readDirectory/searchFiles/getGitStatus`,并在 `finally` unregister;不启动 watcher、不打开文件、 + 不调用 OS reveal。 +- Device reset 完成通知收口:`DevicePresenter` 的开发环境 reset 完成分支不再发送旧的 + `notification:data-reset-complete-dev` raw channel,而是直接发布 typed + `appRuntime.dataResetCompleteDev`。`WindowPresenter` 里对应的旧通道翻译 case 已删除,main/renderer + `NOTIFICATION_EVENTS.DATA_RESET_COMPLETE_DEV` 常量已删除,源码扫描无命中。聚焦单测覆盖 presenter、 + route、client、Data Settings 相关 5 个文件 103 个测试;真实 Data Settings 只读 e2e 与 + `01-launch`、`06-settings-ipc-boundary` 串行运行通过。实际点击 reset data 会删除用户数据,仍只在 + disposable profile 里人工验证。 +- System notification click 收口:`NotificationPresenter` 在 Electron 系统通知被点击时,不再发旧的 + `notification:sys-notify-clicked` raw channel,而是直接发布 typed + `appRuntime.systemNotificationClicked`,payload 形态保持 `{ payload: id }`。`WindowPresenter` + 对应旧通道翻译 case 已删除,main/renderer 的 `NOTIFICATION_EVENTS` 常量也已删除。聚焦单测 4 个文件 + 67 个测试通过,真实主窗口 `01-launch` + `09-main-ipc-boundary` e2e 串行通过。真实 OS 通知展示和点击 + 依赖系统通知权限,仍作为平台人工验证项。 +- Ollama pull progress 收口:`OllamaManager` 不再双发旧的 `ollama:pull-model-progress` raw event, + 只发布 typed `providers.ollama.pull.progress`。renderer 已通过 
`ProviderClient.onOllamaPullProgress` + 和 `ollamaStore` 消费该事件;main/renderer 的 `OLLAMA_EVENTS` 常量已删除,源码扫描无命中。聚焦单测 + 4 个文件 58 个测试通过,真实 Model Providers 只读 e2e 与 `01-launch`、`06-settings-ipc-boundary` + 串行通过。真实拉取模型依赖本机 Ollama daemon 和网络/本地模型缓存,仍作为 opt-in 手测项。 +- Skill catalog/session 收口:`SkillPresenter` 不再双发旧的 `skill:discovered`、 + `skill:installed`、`skill:uninstalled`、`skill:metadata-updated`、`skill:activated`、 + `skill:deactivated` raw event,只发布 typed `skills.catalog.changed` 和 + `skills.session.changed`。`McpIndicator`、skills store 和 settings 已经通过 `SkillClient` 消费 typed + event;main/renderer 的 `SKILL_EVENTS` 常量已删除,源码和测试扫描无命中。聚焦单测 5 个文件 151 个测试通过, + 真实 Skills 设置页只读 e2e 与 `01-launch`、`06-settings-ipc-boundary` 串行通过。安装/卸载/编辑技能会写磁盘, + 仍作为人工或专项 e2e。 +- YoBrowser lifecycle/open 收口:`YoBrowserPresenter` 不再双发旧的 `yo-browser:*` raw event,只发布 + typed `browser.status.changed`、`browser.open.requested` 和 `browser.activity.changed`。旧的 + `yo-browser:window-count-changed` 没有业务消费方,直接退休,不补 typed 替代。`BrowserPanel` 测试也改成 + typed event 名称;main/renderer 的 `YO_BROWSER_EVENTS` 常量已删除,源码和测试扫描无命中。聚焦单测 + 4 个文件 71 个测试通过;真实 browser route e2e 通过。`01-launch`、`06-settings-ipc-boundary` + 单跑通过,三用例组合里 `06` 曾出现 app fixture setup 超时,按既有 e2e harness 抖动记录。 +- MCP sampling 收口:`McpPresenter` 不再双发旧的 `mcp:sampling-request`、 + `mcp:sampling-decision`、`mcp:sampling-cancelled` raw channel,只发布 typed + `mcp.sampling.request`、`mcp.sampling.decision`、`mcp.sampling.cancelled`。`McpClient` 和 + `mcpSampling` store 已经消费 typed event;main/renderer 事件常量里的 sampling 三项已删除,源码和测试扫描无命中。 + 聚焦单测 4 个文件 68 个测试通过,真实 MCP Settings 只读 e2e 与 `01-launch`、 + `06-settings-ipc-boundary` 串行运行通过。真实 approve/reject/cancel sampling 弹窗链路需要一个会发 + sampling 请求的测试 MCP server 和可运行模型路径,仍作为人工或未来专项 e2e。 +- Config font-size 收口:`ConfigPresenter.setSetting('fontSizeLevel', value)` 不再发送旧的 + `config:font-size-changed` raw channel,只通过 typed `settings.changed` 通知 renderer。`uiSettingsStore` + 已经从 `SettingsClient.onChanged` 消费 typed event 并同步 
`fontSizeClass`;main/renderer 的 + `FONT_SIZE_CHANGED` 常量已删除,源码和测试扫描无命中。聚焦单测 6 个文件 88 个测试通过,真实 + config/settings 只读 e2e 与 `01-launch`、`06-settings-ipc-boundary` 串行运行通过。真实 Display + Settings 中调大/调小字体并确认主窗口/设置窗口 class 同步,仍作为人工或未来专项 e2e。 +- NowledgeMem config 收口:`ConfigPresenter.setNowledgeMemConfig` 不再发送旧的 + `config:nowledge-mem-config-updated` raw channel;NowledgeMem 设置页保存/读取完全通过 + `nowledgeMem.updateConfig/getConfig` typed routes。main 侧 `NOWLEDGE_MEM_CONFIG_UPDATED` 常量已删除, + 源码和测试扫描无命中。聚焦单测 5 个文件 83 个测试通过,真实 Knowledge Settings 中的 NowledgeMem + 配置 e2e 与 `01-launch`、`06-settings-ipc-boundary` 串行运行通过,包含临时写入和恢复原配置。真实 + Test Connection 仍需要本机 NowledgeMem 服务,保留人工验证。 +- MCP config bridge 收口:`McpConfHelper.batchImportMcpServers` 不再把 + `MCP_EVENTS.CONFIG_CHANGED` 直接 `sendToRenderer`,而是只发 main 内部事件;`legacyTypedEventBridge` + 继续把它发布成 typed `mcp.config.changed` 给 renderer。renderer 侧未使用的 `MCP_EVENTS` raw 常量块已删除。 + 聚焦单测 5 个文件 89 个测试通过,真实 MCP Settings 只读 e2e 与 `01-launch`、 + `06-settings-ipc-boundary` 串行运行通过。外部 marketplace batch import 会修改 MCP server 配置且可能依赖网络, + 仍作为人工或 opt-in e2e。 +- ACP workspace/debug 收口:`AcpProvider` 和 `AcpProcessManager` 不再发送旧的 + `acp-workspace:*` raw channel;ACP ready 事件改为 typed `sessions.acp.modes.ready`、 + `sessions.acp.commands.ready`、`sessions.acp.configOptions.ready`。ACP debug 事件改成 main 内部 + `ACP_DEBUG_EVENTS.EVENT`,由 bridge 发布 typed `providers.acp.debug.event` 给 renderer。main/renderer + 的 `ACP_WORKSPACE_EVENTS` 常量已删除,ChatStatusBar 测试也改成直接触发 `SessionClient` typed listener。 + 聚焦单测 6 个文件 157 个测试通过,真实 ACP/Provider 设置只读 e2e 与 `01-launch`、 + `06-settings-ipc-boundary` 串行运行通过。真实 ACP agent warmup、debug action、mode/model/config option + 流转需要可运行 agent 和本机依赖,仍作为人工或 opt-in e2e。 +- Electron Knowledge read-only route e2e:真实 Knowledge Settings 页面读取 + `knowledge.isSupported/getSupportedLanguages/getSeparatorsForLanguage/getSupportedFileExtensions`, + 不添加文件、不触发 ingestion、不修改知识库数据。 +- Electron MCP read-only route e2e:真实 MCP Settings 页面读取 + 
`mcp.getEnabled/getServers/getClients/listToolDefinitions/listPrompts/listResources/getNpmRegistryStatus`, + 不切换 MCP、不刷新 registry、不安装 marketplace server、不启停 MCP server。 +- Electron NowledgeMem config route e2e:真实 Knowledge Settings 页面展开 NowledgeMem 配置面板, + 通过 UI 保存临时 base URL/API key,验证 `nowledgeMem.getConfig/updateConfig` typed routes, + 并在用例结束前恢复原配置;不运行需要真实服务的 Test Connection。 +- Electron Dashboard read-only route e2e:真实 Settings Overview dashboard 读取 + `sessions.getUsageDashboard`,验证 summary、calendar、provider/model breakdown、RTK snapshot + 结构;不触发 `sessions.retryRtkHealthCheck`,不修改 session 数据。 +- Electron Skills read-only route e2e:真实 Skills Settings 页面读取 + `skills.getDirectory/listMetadata`;如果当前 profile 存在已安装 skill,则额外验证 + `skills.readFile/getFolderTree/getExtension/listScripts`。用例不安装、不删除、不保存 skill 文件。 +- Skills 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `16-skills-readonly-route` 三个用例一起运行通过;同时收紧 e2e 主窗口识别,避免 floating/settings/splash + 等非主窗口被误判为主聊天窗口。 +- Electron ACP read-only route e2e:真实 ACP Settings 页面读取 + `config.getAcpState/listAcpRegistryAgents/listManualAcpAgents/getAcpSharedMcpSelections/listAgents`, + 验证 ACP 状态、registry agent、manual agent、shared MCP selections、DeepChat/ACP agent list; + 不切换 ACP、不刷新 registry、不安装/修复/卸载 registry agent、不修改 manual agent。 +- ACP 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `17-acp-readonly-route` 三个用例一起运行通过。 +- Electron Provider read-only route e2e:真实 Model Providers 设置页面等待 provider 列表渲染, + 读取 `providers.listSummaries/listDefaults/listModels/getRateLimitStatus`,断言时只保留 provider + 数量、模型数量、字段类型和布尔状态;不保存 provider 设置、不刷新模型、不测试真实连通性、不运行 + OAuth、不同步 ModelScope MCP server、不启动 ACP debug action。 +- Provider 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `18-provider-readonly-route` 三个用例一起运行通过。 +- Electron SkillSync read-only route/event e2e:真实 Skills Settings 页面确认同步状态区存在, + 读取 `skillSync.getRegisteredTools/getNewDiscoveries/scanExternalTools`,并验证 typed + `skillSync.scan.started/completed` 事件可送达;不 acknowledge 
discoveries,不 preview/execute + import/export。 +- SkillSync 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `19-skill-sync-readonly-route` 三个用例一起运行通过。 +- Electron Data Security read-only route e2e:真实 Data Settings 页面确认 database encryption、 + database repair、YoBrowser sandbox 三个区域可见,读取 + `databaseSecurity.getStatus/device.getInfo/device.getAppVersion`;不启用/停用数据库加密、不改密码、 + 不修复 schema、不重置数据、不清理 browser sandbox。 +- Data Security 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `20-data-security-readonly-route` 三个用例一起运行通过。 +- Electron Project read-only route e2e:真实 Environments Settings 页面读取 + `project.listRecent/listEnvironments/pathExists`,并对当前仓库路径和一个生成的不存在路径验证 + `pathExists`;不打开目录、不唤起 native directory picker。 +- Project 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `21-project-readonly-route` 三个用例一起运行通过。 +- Electron Window read-only route e2e:真实主窗口和真实 Settings 窗口分别读取 + `window.getCurrentState`,验证 context-aware route 返回两个不同窗口的状态快照;不最小化、不最大化、 + 不 focus、不关闭窗口。 +- Window 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `22-window-readonly-route` 三个用例一起运行通过。 +- Electron provider install preview e2e:通过 typed + `window.requeuePendingSettingsProviderInstall` route 排队一个自定义 provider 预览,打开真实 Settings + 窗口后验证 Provider 预览弹窗展示 provider 名称、base URL、masked key,并确认 pending preview 队列已消费; + 不点击确认,不写 provider 配置。 +- Provider preview 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `25-window-provider-deeplink-preview` 三个用例一起运行通过。 +- Electron Config settings read-only route e2e:真实 DeepChat Agents、Notifications Hooks、 + Shortcuts 设置页面读取 `config.listAgents`、`config.resolveDeepChatAgentConfig`、 + `config.getAgentMcpSelections`、`config.getHooksNotifications`、`config.getShortcutKeys`;不创建/更新/删除 + agent,不保存 hooks,不执行 hook command,不重置或修改快捷键。 +- Config settings 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `23-config-readonly-route` 三个用例一起运行通过。 +- Electron Shortcut config route/event e2e:真实 Shortcuts 设置页中,从 Settings renderer 通过 + typed `config.setShortcutKeys` 写入临时 
`QuickSearch` 快捷键,验证 + `config.shortcutKeys.changed` typed event,再调用 `shortcut.destroy`、`shortcut.register`、 + `shortcut.unregister`,最后在 `finally` 恢复原始快捷键配置。 +- Shortcut event bridge 收口:`config.shortcutKeys.changed` 现在由 + `ConfigPresenter.setShortcutKey/resetShortcutKeys` 直接发布,`legacyTypedEventBridge` 不再 monkey patch + `configPresenter` 的快捷键方法。聚焦 route/client/component 单测 4 个文件 81 个测试通过。 +- Shortcut 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `28-shortcut-route-restore` 三个用例使用 `--workers=1` 串行运行通过;删除 shortcut monkey patch + 后同一组 e2e 重新构建再跑也通过。Electron 组合用例需要串行跑,因为 DeepChat 有单实例 + `SingletonLock`,并发 worker 可能在启动阶段误失败。 +- Electron Hooks notification command e2e:通过 `config.setHooksNotifications` 保存一条临时 hook, + 在真实 Notifications Hooks 页面确认渲染,再通过 `config.testHookCommand` 执行无副作用本地 + `node -e` 命令,验证 stdout/exit code,最后在 `finally` 恢复原 hooks config。 +- Hooks notification 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `27-hooks-notification-command` 三个用例一起运行通过。 +- Electron DeepChat agent CRUD e2e:真实 DeepChat Agents 设置页通过 UI 创建唯一临时 agent, + 用 `config.listAgents` 验证,再通过 UI 更新名称/描述,最后通过 `config.deleteDeepChatAgent` 删除,并在 + `finally` 里按测试名前缀做兜底清理。 +- DeepChat agent CRUD 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `26-deepchat-agent-crud` 三个用例一起运行通过。 +- Electron Config system read-only route e2e:真实 About 设置页面读取 + `config.getProxySettings`、`config.getUpdateChannel`、`config.getSyncSettings`、 + `config.getSkillDraftSuggestions`、`config.getEntries` 的模型默认值/文件大小配置和 + `upgrade.getStatus`;不打开 General proxy 区域、不修改 proxy/update channel、不检查更新、不下载更新、 + 不打开日志目录、不刷新 provider DB。 +- Config system 聚焦稳定性 e2e:`01-launch`、`06-settings-ipc-boundary`、 + `24-config-system-readonly-route` 三个用例一起运行通过。 +- Upgrade/About 聚焦稳定性 e2e:重新构建后,`01-launch`、`06-settings-ipc-boundary`、 + `24-config-system-readonly-route` 三个用例使用 `--workers=1` 串行运行通过。 +- 稳定本地用户路径组合 e2e:启动、settings navigation、settings IPC boundary、floating IPC boundary、 + browser route lifecycle、main renderer IPC boundary、Data 
Settings privacy mode、Remote Control + read-only routes、Knowledge read-only routes、MCP read-only routes、NowledgeMem config route + 和 Dashboard read-only route 十二个用例一起运行通过。e2e launcher 的主窗口等待放宽到 60 秒, + 避免长组合顺序运行时出现冷启动误报。 +- 包含 Skills 的 13 用例长组合暂不升级为稳定 gate:本轮长组合里的 `01-launch` 和 + `08-browser-route` 在 Electron app setup 阶段超时,但二者随后单跑通过,Skills 单跑和聚焦组合也通过; + 当前归类为 e2e harness 稳定性问题,不是 presenter route 行为失败。 +- Electron floating IPC boundary e2e:通过 typed config route 打开真实 floating renderer,验证 built/e2e + 模式加载 bundled renderer 文件,窗口只暴露 `floatingButtonAPI`,不暴露 broad + `window.electron`、`window.deepchat`、`api.ipcRenderer`,并在用例结束后恢复原 floating 设置。 +- Electron browser route e2e:用 `browser.loadUrl` 加载本地 `data:` 页面,轮询 + `browser.getStatus` 到 ready,验证 typed `browser.status.changed` 事件并调用 `browser.destroy`; + 该用例故意不清理真实 profile 的 browser sandbox。 +- Session/Conversation/Stream runtime 收口:`AgentSessionPresenter` 删除旧 `session:*` renderer + 双发,只保留 `sessions.updated` typed event;`AgentRuntimePresenter`、`dispatch`、`echo` 和 + `PendingInputCoordinator` 删除旧 `stream:*`/`session:*` renderer 发送,改为 + `chat.stream.updated/completed/failed`、`sessions.status.changed`、 + `sessions.pendingInputs.changed` 和新增 `sessions.compaction.changed`;旧 + `sessionPresenter` 的 conversation/tab/message managers 停止发送无人消费的 `conversation:*`; + `LifecycleManager.notifyMessage` 不再动态转发任意 lifecycle event 到 renderer。源码层 + `eventBus.sendToRenderer` 只剩 typed publisher `publishDeepchatEvent`。 +- 本轮验证:`format`、`i18n`、`lint`、`typecheck`、`electron-vite build` 均通过;聚焦单测 9 个文件 + 339 个测试通过;e2e 中 `01-launch`、`09-main-ipc-boundary`、`23-config-readonly-route` + 通过,`06-settings-ipc-boundary` 在四用例组合里 Electron app fixture setup 超时后单跑通过, + `01-launch + 09-main-ipc-boundary` 使用 `--workers=1` 组合通过。 +- 最后一轮 presenter event 扫尾:`eventBus.send(...)` 已经在 `src/main` / `src/renderer` + 源码中清零,`legacyTypedEventBridge` 已删除且无引用;`eventBus.sendToRenderer` 在运行时代码中只剩 + typed publisher `publishDeepchatEvent` 使用。`WindowPresenter` / `TabPresenter` 中无人订阅的旧广播 
+ 已删除,包括 `system-theme-updated`、窗口最大化/全屏旧 channel、`setActiveTab`、 + `update-window-tabs` 和 `tab:title-updated`。 +- 当前 `src/main/presenter` 下仍能搜到的 `webContents.send(...)` 不再是全局 presenter 事件迁移缺口, + 而是明确保留的独立窗口/专用 preload 协议:floating button 的 `floatingButtonAPI` channel、 + splash/database-unlock 启动期 channel、browser overlay activity channel,以及 ACP terminal 发给 + settings webContents 的 `DEEPCHAT_EVENT_CHANNEL` typed envelope。若后续要继续收敛这些小窗口, + 应先为 secondary renderer 增加 typed-envelope preload 支持,再迁移发送端。 +- 最新聚焦验证:`contracts.test.ts`、`dispatcher.test.ts`、`clients.test.ts`、 + `preloadBoundaries.test.ts` 共 4 个文件 84 个测试通过;`windowPresenter.test.ts` 1 个文件 + 4 个测试通过。 +- 最新用户视角 e2e:`01-launch`、`06-settings-ipc-boundary`、`07-floating-ipc-boundary`、 + `09-main-ipc-boundary`、`22-window-readonly-route`、`23-config-readonly-route` 使用 + `-c test/e2e/playwright.config.ts --workers=1` 运行通过,共 6 个测试。为了避免本机真实 + DeepChat profile 的加密数据库 splash 和首次引导状态干扰自动化验证,e2e fixture 现在默认创建临时 + `DEEPCHAT_E2E_USER_DATA_DIR`,并写入已完成 onboarding 的最小 `app-settings.json`。 +- 2026-06-13 收尾补充:renderer 侧无人引用的 `WINDOW_EVENTS` / `SYSTEM_EVENTS` 常量已删除, + `docs/architecture/event-system.md` 已改为说明这些窗口事件只属于 main 内部协作;全量本地 smoke + e2e 使用 `--workers=1` 跑完,结果为 26 个通过、3 个跳过。跳过项是 live provider/chat 集成测试, + 需要 `RUN_PROVIDER_INTEGRATION=true` 和显式配置好的 provider/model/API key。 +- 同日最终门禁:`format`、`i18n`、`lint`、`typecheck`、focused Vitest 5 个文件 88 个测试通过; + `src/renderer/src/env.d.ts` 显式补齐 Vite env、CSS、`?url` asset 和 inline worker 声明,避免 + `vue-tsgo` 依赖隐式 `vite/client` 合并。 +- 同日完整单测门禁:`pnpm test -- --silent --reporter=dot` 通过,382 个文件通过、6 个跳过, + 3192 个测试通过、41 个跳过;其中把陈旧的 `session:activated` / `stream:end` 测试断言改成 + typed `sessions.updated` / `chat.stream.completed`,Config helper 测试也补齐 `sendToMain` 与 typed + renderer publisher mock。 + +仍未满足: + +- 真实外部服务/本机 profile 的人工验证还没有全部完成。 +- Provider 外部动作仍需人工或带真实凭据的 opt-in smoke:refresh models、provider live + connection、key status、rate-limit update、Ollama model pull progress、live chat generation、 + 
session persistence、GitHub Copilot OAuth、ACP debug action。 +- SkillSync 仍需人工验证真实导入/导出和冲突处理,因为这些会写入 DeepChat skill 目录或外部工具目录。 +- MCP sampling 仍需人工或专项 e2e 验证真实 approve/reject/cancel 弹窗链路,因为现有只读 e2e 不会启动 + 会发 sampling 请求的 MCP server,也不会跑模型调用。 +- Display Settings 字体大小仍需人工或专项 e2e 验证真实 UI 点击和跨窗口 class 同步,因为现有 config + smoke 只读,不修改用户显示设置。 +- NowledgeMem Test Connection 仍需人工或 opt-in e2e,因为它依赖本机或测试环境中真实运行的 + NowledgeMem 服务。 +- MCP 外部 batch import 仍需人工或 opt-in e2e,因为它会修改 MCP server 配置,并可能依赖外部 marketplace + 数据。 +- ACP runtime 行为仍需人工或 opt-in e2e:真实 agent warmup、debug action、mode/model/config option + 变更都依赖本机 agent/runtime 环境。 +- Data/database 外部或破坏性动作仍需在 disposable/copied profile 上人工验证:数据库加密启用/改密/停用、 + database repair、各类 reset data、开发环境 reset 完成提示、YoBrowser sandbox clear、真实加密库 + splash unlock。 +- Project/native path 仍需人工验证:目录选择器、open directory、remote/default workdir 选择和 OS + shell 集成。 +- Window 行为型动作仍需人工验证:focus main、minimize、maximize/restore、close settings/current + window,以及 OS 级 `deepchat://provider/install` 协议分发到 preview queue 的端到端行为。 +- Config 行为型动作仍需人工验证:DeepChat agent 的高级编辑项,例如模型选择、默认项目路径、工具开关、 + subagent slots 和 auto-compaction 控件;hooks notification 的自定义脚本/失败场景和真实事件派发; + system notification 的真实 OS 展示/点击; + Shortcut Settings UI 里的编辑、清除、重置、保存动作,以及 OS global shortcut 的真实按键触发、 + focus/blur 后是否重复注册、快捷键冲突处理;proxy/update channel 保存、打开日志目录、provider DB + refresh、真实 update check/download/restart install,因为这些会修改用户设置、依赖平台全局快捷键状态、 + 调用 OS shell、重启应用或触发网络/元数据刷新。 + +最终合并前仍建议跑下面的 gate: + +```bash +rg "useLegacyPresenter|useLegacyRemoteControlPresenter|useLegacyShortcutPresenter" src/renderer +rg "@api/legacy|legacy/presenters|legacy/runtime" src +rg "presenter:call|remoteControlPresenter:call" src/main src/renderer +rg "DISPATCHABLE_PRESENTERS|REMOTE_CONTROL_METHODS|src/renderer/api/legacy" src/main src/renderer src/preload +node scripts/architecture-guard.mjs +pnpm run format +pnpm run i18n +pnpm run lint +pnpm run typecheck +pnpm test +``` + +多个 Electron e2e spec 合并运行时请加 
`--workers=1`,避免单实例锁导致第二个 Electron 进程启动失败。 + +搜索必须只剩明确 allowlist,例如 preload/runtime 兼容层;业务组件里不能再有。 diff --git a/docs/architecture/presenter-ipc-migration-plan/plan.md b/docs/architecture/presenter-ipc-migration-plan/plan.md new file mode 100644 index 000000000..3e1a51840 --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/plan.md @@ -0,0 +1,643 @@ +# Presenter IPC Migration Completion - Plan + +## Target Architecture + +```text +Renderer UI / stores / settings + -> renderer/api domain clients + -> window.deepchat.invoke/on + -> shared/contracts routes + events + -> src/main/routes handlers/services + -> narrow presenter-backed ports + -> presenter runtime owners +``` + +Rules for the remaining migration: + +- Route and client names should follow product domains (`RemoteControlClient`, `KnowledgeClient`, + `SkillSyncClient`) rather than presenter class names. +- `EventBus` may remain internal to main, but renderer-visible events should be emitted with + `publishDeepchatEvent`. +- Long-running operations need explicit progress events or task IDs; do not rely on raw + `eventBus.sendToRenderer` channels. +- Avoid exposing broad utility methods from `windowPresenter`, `configPresenter`, or + `llmproviderPresenter`. Add narrow commands instead. + +## Phase 0 - Make The Guard Honest + +Status: complete for the active migration. The guard now scans settings, forbids renderer business +imports from `@api/legacy/**`, treats a recreated `src/renderer/api/legacy/**` directory as a +regression, has fixture tests for settings legacy/raw IPC, and the baseline reports show zero +renderer legacy counts. 
+ +Update the migration guard before migrating individual presenters: + +| Change | Files | Status | +| --- | --- | --- | +| Add renderer roots to scan: settings, splash, floating, browser overlay, plugin settings | `scripts/architecture-guard.mjs`, `scripts/generate-architecture-baseline.mjs` | Done for settings/business roots and regenerated baseline | +| Keep allowlists explicit for `src/renderer/api/runtime.ts` and specialized preloads | same scripts | Done for the active guard | +| Add phase gates for settings renderer legacy counts | same scripts plus baseline JSON/MD | Done | +| Add tests that a fixture under settings fails on `useLegacyPresenter` and raw IPC | `test/main` or script tests | Done | + +Side effect: the guard will initially fail. Land this with a temporary baseline or bridge register +that lists every active exception from `audit.md`, then remove exceptions as each phase lands. + +## Presenter-by-Presenter Migration Plan + +### `configPresenter` + +Current legacy methods: + +- ACP: `getAcpEnabled`, `setAcpEnabled`, `listAcpRegistryAgents`, `refreshAcpRegistry`, + `ensureAcpAgentInstalled`, `repairAcpAgent`, `uninstallAcpRegistryAgent`, + `setAcpAgentEnabled`, `setAcpAgentEnvOverride`, `listManualAcpAgents`, `addManualAcpAgent`, + `updateManualAcpAgent`, `removeManualAcpAgent`. +- DeepChat agents: `listAgents`, `createDeepChatAgent`, `updateDeepChatAgent`, + `deleteDeepChatAgent`, `getSystemPrompts`. +- Settings helpers: `getSetting`, `setSetting`, `getProxyMode`, `setProxyMode`, + `getCustomProxyUrl`, `setCustomProxyUrl`, `getUpdateChannel`, `setUpdateChannel`, + `openLoggingFolder`, `refreshProviderDb`. +- Hooks: `getHooksNotificationsConfig`, `setHooksNotificationsConfig`, `testHookCommand`. +- Skill draft suggestions: `getSkillDraftSuggestionsEnabled`, + `setSkillDraftSuggestionsEnabled`. + +Target: + +- Extend existing `ConfigClient` where a compatible route already exists.
+- Add narrow route groups for missing domains: + - `config.acp.*` for ACP registry/manual-agent lifecycle. + - `config.agents.create/update/delete` for DeepChat agent CRUD. + - `config.hooksNotifications.get/set/test`. + - `config.proxy.get/set`, `config.updateChannel.get/set`, `config.openLoggingFolder`. + - Move `refreshProviderDb` to a provider/database route if possible, because it is not general + config editing. +- Replace `CONFIG_EVENTS.AGENTS_CHANGED` direct listener in `AcpSettings.vue` with + `ConfigClient.onAgentsChanged`. + +Tests: + +- Contract schema tests for ACP agent install state, manual agent input, hooks config, proxy mode. +- Route handler tests with mocked `configPresenter`. +- Renderer client tests for new methods. +- Component tests for `AcpSettings`, `DeepChatAgentsSettings`, `NotificationsHooksSettings`, + proxy/logging/default-model sections. + +Side effects: + +- ACP install/repair/uninstall can be slow and writes to runtime directories. Preserve existing + progress/state semantics and avoid route timeouts. +- Hooks config may contain command strings; schema should preserve existing values but reject + malformed structures. +- Proxy changes trigger main-process network side effects through existing `CONFIG_EVENTS`. + +Manual validation: + +- Toggle ACP globally, install/repair/uninstall one registry agent, add/edit/remove one manual ACP + agent, and confirm agent list refreshes in settings and new-thread surfaces. +- Create/edit/delete a DeepChat agent and verify session creation still resolves its config. +- Change proxy mode/custom URL and verify provider test connection uses the new proxy state. +- Open logging folder from settings on macOS/Windows/Linux. + +### `llmproviderPresenter` + +Current legacy methods: + +- `getKeyStatus`, `refreshModels`. +- `getDimensions`. +- `syncModelScopeMcpServers`. +- `getProviderRateLimitStatus`, `updateProviderRateLimit`. +- `runAcpDebugAction`. 
+ +Target: + +- Use existing `ProviderClient.refreshModels` and `ProviderClient.getProviderRateLimitStatus` + where possible. +- Add: + - `providers.getKeyStatus`. + - `providers.updateRateLimit`. + - `models.getEmbeddingDimensions` or extend `models.getCapabilities` if dimensions belong there. + - `providers.modelScope.syncMcpServers`. + - `providers.acp.debug.run` plus typed `providers.acp.debug.event`. +- Replace `RATE_LIMIT_EVENTS.*` and `ACP_DEBUG_EVENTS.EVENT` raw listeners with typed events. + +Tests: + +- Provider route handler tests for key status, rate-limit update, ModelScope sync, ACP debug action. +- Event contract tests for rate-limit and ACP debug events. +- Renderer tests for `ProviderApiConfig`, `ProviderRateLimitConfig`, `ModelScopeMcpSync`, + `AcpDebugDialog`. + +Side effects: + +- Key status and ACP debug may touch credentials or subprocess state. Route outputs must stay + redacted. +- Rate-limit events can be frequent; keep payload small and versioned. +- Model refresh can hit external providers; tests should mock provider runtime. + +Manual validation: + +- Refresh models for one configured provider. +- Toggle provider rate limiting and confirm queued/executed counters update. +- Run ACP debug action and confirm the debug dialog receives live logs without leaking secrets. + +### `devicePresenter` + +Current legacy methods: + +- `getDeviceInfo`, `getAppVersion`, `selectDirectory`, `selectFiles`, `resetDataByType`. + +Target: + +- Replace `getDeviceInfo`, `getAppVersion`, and `selectDirectory` with existing `DeviceClient`. +- Add `device.selectFiles`. +- Add `device.resetDataByType` or a more explicit `data.reset` route. +- Move direct clipboard/open-external/file-path calls in components to `DeviceClient`, + `BrowserClient`, or `FileClient` runtime wrappers. + +Tests: + +- Device route contract and handler tests. +- Renderer tests for file selection and data reset UI. + +Side effects: + +- `resetDataByType` is destructive. 
Route should require an explicit reset type enum and keep the + existing confirmation UI unchanged. +- Native file dialogs are hard to automate; unit-test the route and manually verify dialog behavior. + +Manual validation: + +- Select files in skill install and knowledge file flows. +- Reset chat/config/knowledge data in a disposable profile and confirm app restarts or refreshes as + expected. + +### `windowPresenter` + +Current legacy methods and patterns: + +- `closeSettingsWindow`, `focusMainWindow`, `setPendingSettingsProviderInstall`, + `consumePendingSettingsProviderInstall`, `sendToAllWindows`. +- Raw settings events: navigation, provider install preview, settings ready, update check. +- Several settings pages pass `windowPresenter` only to guided onboarding helpers. + +Target: + +- Replace onboarding helper dependency with `WindowClient.focusMainWindow` or a narrow + `system.focusMainWindow` route. +- Add explicit settings routes/events: + - `settings.closeCurrentWindow`. + - `settings.providerInstall.consumePending`. + - `settings.providerInstall.requested` typed event. + - `settings.navigation.requested` typed event or use existing `system.openSettings`. +- Do not expose `sendToAllWindows`. Replace update check with `UpgradeClient.check` or a narrow + `upgrade.check` call. +- Remove unused `windowPresenter` injections from settings pages. + +Tests: + +- Route context tests for current-window behavior using `webContentsId/windowId`. +- Settings app tests for navigation/provider install preview. +- Guided onboarding tests with a mocked narrow focus function. + +Side effects: + +- Settings is a separate BrowserWindow. Current-window routes must use the invoking webContents, + not whichever main window is focused. +- Provider deeplink preview must still arrive if settings opens after the deeplink is received. + +Manual validation: + +- Open settings from main, navigate to provider/model/MCP/skills guided onboarding steps, then return + focus to main. 
+- Trigger `deepchat://provider/install` and confirm preview opens in settings. +- Check for updates from About settings. + +### `skillSyncPresenter` + +Current legacy methods: + +- `scanExternalTools`, `getNewDiscoveries`, `acknowledgeDiscoveries`, `getRegisteredTools`, + `previewImport`, `executeImport`, `previewExport`, `executeExport`. +- Raw events: `SKILL_SYNC_EVENTS.NEW_DISCOVERIES`, scan/import/export progress. + +Target: + +- Add `skillSync.*` routes and `SkillSyncClient`. +- Add typed events: + - `skillSync.discoveries.changed`. + - `skillSync.scan.started/completed`. + - `skillSync.import.progress/completed`. + - `skillSync.export.progress/completed`. +- Keep payloads based on `@shared/types/skillSync`, but add route schemas for tool IDs, skill names, + conflict strategy, export target, and result envelopes. + +Tests: + +- Route contract tests for import/export inputs. +- Handler tests with mocked scanner/converter. +- Renderer tests for sync prompt, status section, import wizard, export wizard. + +Side effects: + +- Import/export writes files outside app data. Preserve existing permission and path validation. +- Worker fallback behavior must stay the same. + +Manual validation: + +- Scan installed external tools. +- Import one skill with each conflict option in a temporary skills directory. +- Export one active skill to at least one supported external tool format. + +### `projectPresenter` + +Current legacy methods: + +- `getRecentProjects`, `selectDirectory`, `pathExists`. + +Target: + +- Replace recent projects and directory selection with existing `ProjectClient.listRecent` and + `ProjectClient.selectDirectory`. +- Add `project.pathExists`. + +Tests: + +- Project route handler test for `pathExists`. +- Renderer tests for environment/default workdir validation. + +Side effects: + +- `pathExists` can leak local filesystem existence. Keep it a user-initiated settings route and avoid + returning extra metadata. 
+ +Manual validation: + +- Remote-control default workdir picker and environment settings path validation. + +### `knowledgePresenter` + +Current legacy methods: + +- `isSupported`, `getSupportedLanguages`, `getSeparatorsForLanguage`, `getSupportedFileExtensions`, + `validateFile`, `addFile`, `deleteFile`, `reAddFile`, `listFiles`, `similarityQuery`, + `pauseAllRunningTasks`, `resumeAllPausedTasks`. +- Raw events: `RAG_EVENTS.FILE_UPDATED`, `RAG_EVENTS.FILE_PROGRESS`. + +Target: + +- Add `knowledge.*` routes and `KnowledgeClient`. +- Add typed events: + - `knowledge.file.updated`. + - `knowledge.file.progress`. +- Reuse existing `config.getKnowledgeConfigs` / `config.setKnowledgeConfigs` for config list editing, + but move runtime file/index operations to `KnowledgeClient`. + +Tests: + +- Route contract tests for file IDs, knowledge base IDs, query string, validation result. +- Main tests using mocked `knowledgePresenter` and `filePresenter`. +- Renderer tests for knowledge file upload/list/progress. + +Side effects: + +- File ingestion can trigger embeddings and vector DB writes. Keep operation status visible and avoid + large progress payloads. +- Similarity query can expose indexed content. Preserve current UI-only access pattern. + +Manual validation: + +- Add a supported file, watch progress, pause/resume, re-add, delete, and run a similarity query. +- Verify unsupported file handling and file-size validation. + +### `agentSessionPresenter` + +Current legacy methods: + +- `getAgents`, `getUsageDashboard`, `retryRtkHealthCheck`. + +Target: + +- Replace `getAgents` with existing `SessionClient.getAgents` or `ConfigClient.listAgents`, + depending on UI need. +- Add `sessions.usageDashboard.get`. +- Add `sessions.rtkHealth.retry`. + +Tests: + +- Route handler tests for dashboard aggregation and RTK retry dispatch. +- Dashboard settings component tests. + +Side effects: + +- Usage dashboard may scan many sessions. Preserve pagination/aggregation performance. 
+- RTK health retry may start background checks; keep it explicit and user-triggered. + +Manual validation: + +- Open dashboard settings with a non-empty history. +- Trigger RTK health retry and verify status updates or logs. + +### `remoteControlPresenter` + +Current legacy methods: + +- Generic channel methods: `listRemoteChannels`, `getChannelSettings`, `saveChannelSettings`, + `getChannelStatus`, `getChannelBindings`, `removeChannelBinding`, `removeChannelPrincipal`, + `getChannelPairingSnapshot`, `createChannelPairCode`, `clearChannelPairCode`. +- Legacy channel-specific methods still used by compatibility code for Telegram and Weixin iLink. +- `RemoteControlRuntime.ts` wraps `remoteControlPresenter:call`. + +Target: + +- Add `remoteControl.*` routes and `RemoteControlClient`. +- Prefer generic channel routes over channel-specific renderer methods: + - `remoteControl.listChannels` + - `remoteControl.getSettings` + - `remoteControl.saveSettings` + - `remoteControl.getStatus` + - `remoteControl.listBindings` + - `remoteControl.removeBinding` + - `remoteControl.removePrincipal` + - `remoteControl.getPairingSnapshot` + - `remoteControl.createPairCode` + - `remoteControl.clearPairCode` + - `remoteControl.weixinIlink.startLogin/waitLogin/removeAccount/restartAccount` +- Delete `RemoteControlRuntime.ts` after `RemoteSettings.vue` uses the typed client. + +Tests: + +- Route schema tests for discriminated channel payloads. +- Handler tests with mocked `remoteControlPresenter`. +- Renderer tests for Telegram/Feishu/QQBot/Discord/Weixin settings panels. + +Side effects: + +- Remote control stores credentials and account bindings. Outputs must be redacted. +- Weixin login wait is long-running; route should support timeout and cancellation semantics. +- Some channels require network access and cannot be fully automated. + +Manual validation: + +- Telegram: save token, create/clear pair code, bind/unbind a chat. 
+- Feishu/QQBot/Discord: toggle remote control settings and verify status display. +- Weixin iLink: start login, wait for success/failure, restart/remove account. + +### `skillPresenter` + +Current legacy method: + +- `readSkillFile`. + +Target: + +- Add `skills.readFile` or extend `SkillClient` with a read method. +- Keep name validation and path resolution inside `skillPresenter`; renderer passes only skill name. + +Tests: + +- Route schema rejects empty/traversal-like names. +- Skill editor test loads content through `SkillClient`. + +Side effects: + +- Reading arbitrary files must not be exposed. Only skill-owned files should be reachable. + +Manual validation: + +- Open an installed skill in the editor, edit, save, and reopen. + +### `mcpPresenter` + +Current legacy methods: + +- MCP Router market helpers: `getMcpRouterApiKey`, `setMcpRouterApiKey`, + `updateMcpRouterServersAuth`, `isServerInstalled`, `listMcpRouterServers`, + `installMcpRouterServer`. + +Target: + +- Add `mcp.router.*` routes and `McpClient` methods. +- Keep API key storage and server install logic in main. +- Use existing MCP typed events for config/server status changes where possible. + +Tests: + +- Route handler tests for API key read/write with redaction as needed. +- Market install tests with mocked router manager/network. + +Side effects: + +- MCP Router calls can hit network and persist credentials. +- Installing a server modifies MCP config and can start/stop server processes. + +Manual validation: + +- Save MCP Router API key, list market servers, install one server, verify it appears in MCP settings. + +### `exporter` / NowledgeMem + +Current legacy methods: + +- `getNowledgeMemConfig`, `updateNowledgeMemConfig`, `testNowledgeMemConnection`. + +Target: + +- Add `nowledgeMem.getConfig`, `nowledgeMem.updateConfig`, `nowledgeMem.testConnection` routes and + a `NowledgeMemClient`, or place them under an `export` route group if preferred. 
+ +Tests: + +- Route schema bounds timeout and URL fields. +- Handler tests mock `exporter`. +- Renderer test for `NowledgeMemSettings`. + +Side effects: + +- Test connection performs network I/O. Unit tests must mock it; manual validation should use a local + disposable endpoint. + +Manual validation: + +- Save config, test connection success/failure, reload settings and confirm persistence. + +### `filePresenter` + +Current legacy methods: + +- `getMimeType`, `prepareFile`. + +Target: + +- Replace with existing `FileClient.getMimeType` and `FileClient.prepareFile`. + +Tests: + +- Component test for prompt editor file upload can mock `FileClient`. + +Side effects: + +- None expected if method semantics are preserved. + +Manual validation: + +- Attach a prompt file and confirm text extraction/preview still works. + +### `toolPresenter` + +Current legacy method: + +- `getAllToolDefinitions`. + +Target: + +- Replace with existing `ToolClient.getAllToolDefinitions`. + +Tests: + +- DeepChat agent settings component test with disabled tool selections. + +Side effects: + +- Tool definitions depend on MCP config and agent mode; make sure the typed call passes the same + context as the legacy call. + +Manual validation: + +- Open DeepChat agent settings and toggle disabled agent tools. + +### `sqlitePresenter` + +Current legacy method: + +- `repairSchema`. + +Target: + +- Add a narrow `database.repairSchema` or `databaseSecurity.repairSchema` route. Keep it separate + from encryption routes if the semantics are operational repair rather than security. + +Tests: + +- Handler test with mocked repair report. +- Data settings component test for repair result display. + +Side effects: + +- Repair can mutate local database schema. Manual validation should use a copied test profile. + +Manual validation: + +- Trigger repair on a disposable profile and verify the report UI. + +### `yoBrowserPresenter` + +Current legacy method: + +- `clearSandboxData`. 
+ +Target: + +- Add `browser.clearSandboxData` to `BrowserClient`. + +Tests: + +- Browser route handler test with mocked presenter. +- Data settings component test. + +Side effects: + +- Clears browser sandbox/cache. Make the destructive action explicit in UI. + +Manual validation: + +- Clear sandbox data and verify browser sessions start cleanly. + +### `oauthPresenter` + +Current legacy methods: + +- `startGitHubCopilotLogin`, `startGitHubCopilotDeviceFlowLogin`. + +Target: + +- Add `oauth.githubCopilot.startLogin` and `oauth.githubCopilot.startDeviceFlowLogin`, or place them + under provider auth routes if provider ownership is preferred. +- Keep OAuth callback/deeplink handling in main. + +Tests: + +- Route handler tests with mocked `oauthPresenter`. +- Renderer test for `GitHubCopilotOAuth`. + +Side effects: + +- Opens external auth flow and writes credentials. Unit tests must mock shell/deeplink behavior. + +Manual validation: + +- Run both GitHub Copilot auth flows in a disposable account or mocked auth environment. + +### `shortcutPresenter` + +Current legacy methods: + +- `registerShortcuts`, `destroy` through `ShortcutRuntime`. + +Target: + +- Prefer removing renderer control if main lifecycle already owns shortcut registration. +- If renderer control is still required, add narrow `shortcuts.register` and `shortcuts.unregister` + routes and replace `ShortcutRuntime`. + +Tests: + +- Shortcut store test confirms it calls typed client or no longer calls main. +- Existing `shortcutPresenter` main tests stay as runtime behavior coverage. + +Side effects: + +- Global shortcuts affect the OS. Avoid duplicate registration when app focus changes. + +Manual validation: + +- Change shortcut settings, blur/focus app, and confirm shortcuts work once without duplicates. 
+ +## Event Migration Plan + +| Raw event | Target | +| --- | --- | +| `STREAM_EVENTS.END/ERROR` fallback in `messageIpc.ts` | Remove after all terminal refresh paths publish `chat.stream.completed/failed`; add typed event for `emitMessageRefresh` if needed | +| `context-menu-translate`, `context-menu-ask-ai` | Add typed context-menu event or a narrow preload API; keep DOM CustomEvent inside renderer | +| `SETTINGS_EVENTS.NAVIGATE`, `SETTINGS_EVENTS.PROVIDER_INSTALL` | `settings.navigation.requested`, `settings.providerInstall.requested` typed events | +| `NOTIFICATION_EVENTS.SHOW_ERROR`, database repair suggested | Typed notification/settings events or explicit settings store action | +| `CONFIG_EVENTS.AGENTS_CHANGED` | Existing `config.agents.changed` | +| `ACP_DEBUG_EVENTS.EVENT` | `providers.acp.debug.event` | +| `RAG_EVENTS.FILE_UPDATED/FILE_PROGRESS` | `knowledge.file.updated/progress` | +| `RATE_LIMIT_EVENTS.*` | `providers.rateLimit.*` typed events | +| `SKILL_SYNC_EVENTS.*` | `skillSync.*` typed events | +| `skill:installed/uninstalled/metadata-updated` | Existing `skills.catalog.changed` | +| `acp-init:*`, `external-deps-required`, `acp-terminal:*` | ACP init/terminal typed specialized API or route/event group | + +## Verification Strategy + +Automated gates after each implementation PR: + +```bash +pnpm run format +pnpm run i18n +pnpm run lint +pnpm run typecheck +pnpm test -- test/main/routes test/main/contracts test/renderer/api +pnpm test -- test/renderer/components/<AffectedComponent>.test.ts +node scripts/architecture-guard.mjs +``` + +Manual verification is required for: + +- Native file/directory dialogs. +- OAuth login/device flow. +- ACP agent install/repair/uninstall and terminal interaction. +- Remote-control channel login/pairing with real services. +- Database reset/repair on a copied profile. +- Floating widget drag/open-session behavior. +- Splash database unlock flow.
diff --git a/docs/architecture/presenter-ipc-migration-plan/spec.md b/docs/architecture/presenter-ipc-migration-plan/spec.md new file mode 100644 index 000000000..87224ed58 --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/spec.md @@ -0,0 +1,78 @@ +# Presenter IPC Migration Completion - Spec + +> Status: automated migration gate passed; external/manual validation remains. +> Audit snapshot: 2026-06-10; latest verification snapshot: 2026-06-11 on branch +> `codex/presenter-ipc-migration-plan`. + +## Problem + +DeepChat has a typed renderer-main boundary for the main chat path: + +```text +renderer/api/*Client + -> window.deepchat + -> shared/contracts routes + events + -> src/main/routes + -> presenter-backed ports +``` + +At the start of this work the migration was incomplete: the main window hot path was mostly +migrated, but settings and secondary renderer surfaces still used legacy presenter reflection, raw +`window.electron.ipcRenderer` channels, or direct `window.api` calls. + +The stale signal was risky: `docs/architecture/baselines/main-kernel-migration-scoreboard.md` +claimed P5 was ready and `node scripts/architecture-guard.mjs` passed, while the source still +contained settings renderer legacy calls. The guard protected the migrated main renderer hot path +more than the full renderer surface. The current branch expands that guard and removes the broad +renderer legacy transport from business code. + +## Goals + +1. Remove renderer business dependency on `useLegacyPresenter()`, `useLegacyRemoteControlPresenter()`, + `useLegacyShortcutPresenter()`, raw `window.electron`, and direct `window.api`. +2. Replace every renderer-visible presenter method with a typed domain client backed by + `src/shared/contracts/routes/*.routes.ts`, `src/shared/contracts/events/*.events.ts`, and + `src/main/routes`. +3. Keep `EventBus` as an internal main-process coordination mechanism, but publish renderer-visible + notifications through typed events. +4. 
Retire `ipcMain.handle('presenter:call')` and `ipcMain.handle('remoteControlPresenter:call')` + once no renderer imports the legacy transport. +5. Extend architecture guard coverage so future changes cannot reintroduce legacy IPC in + `src/renderer/settings`, `src/renderer/splash`, `src/renderer/floating`, + `src/renderer/browser-overlay`, or other renderer entry points. + +## Non-Goals + +- No behavior redesign of presenters themselves. +- No data-model migration unless a typed route requires payload normalization for existing data. +- No removal of main-process internal `EventBus` listeners. +- No immediate removal of specialized preload APIs for floating, splash, browser overlay, or plugin + settings if they are still the correct boundary for a dedicated renderer. They should still get + typed payload validation and explicit allowlists. +- No UI redesign. + +## Acceptance Criteria + +- `rg "useLegacyPresenter|useLegacyRemoteControlPresenter|useLegacyShortcutPresenter" src/renderer` + only finds legacy quarantine definitions or returns no business usages. +- `rg "window\\.electron|window\\.api" src/renderer` only finds explicitly allowlisted runtime + wrappers or specialized preloads; settings/business components have zero direct hits. +- All renderer-visible calls are represented in shared route/event contracts with zod validation. +- `presenter:call` and `remoteControlPresenter:call` handlers are removed or gated behind a documented + temporary bridge register with zero active renderer consumers. +- `scripts/architecture-guard.mjs` scans all renderer roots and fails on new legacy IPC outside + allowlisted wrappers. +- Existing tests pass for affected domains, and each new route/client/event has focused unit coverage. +- Manual verification covers the surfaces that cannot be safely automated, especially external + integrations such as ACP install, remote-control login/pairing, provider OAuth, and database reset. 
+ +## Constraints + +- New renderer-main capabilities must use shared contracts and `renderer/api/*Client`. +- Do not expose broad presenter methods through new typed routes. Prefer domain-specific routes with + narrow input/output schemas. +- Avoid adding methods such as `windowPresenter.sendToAllWindows` to typed clients. Replace the user + workflow with a narrower command or event. +- Preserve dual publish only during an individual migration PR. After the consumer is migrated, remove + the legacy raw event in the same PR or a direct follow-up PR. +- Secrets and tokens must never be sent through broad typed events or logged in route errors. diff --git a/docs/architecture/presenter-ipc-migration-plan/tasks.md b/docs/architecture/presenter-ipc-migration-plan/tasks.md new file mode 100644 index 000000000..7e3099f26 --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/tasks.md @@ -0,0 +1,970 @@ +# Presenter IPC Migration Completion - Tasks + +> Status: active execution record. Each checked item must have static or test evidence below it. + +## T0 - Documentation And Audit + +- [x] Create branch `codex/presenter-ipc-migration-plan`. +- [x] Audit typed routes/events and legacy renderer IPC usage. +- [x] Write spec, audit, plan, and tasks. + +Verification: + +- `node scripts/architecture-guard.mjs` currently passes, confirming the guard gap rather than + proving migration completion. + +## T1 - Architecture Guard Coverage + +- [x] Extend guard scans to all renderer roots, especially `src/renderer/settings` and + `src/renderer/splash`. +- [x] Add explicit allowlists for runtime wrappers and specialized preload APIs. +- [x] Treat retired `src/renderer/api/legacy/**` as forbidden instead of quarantine. +- [x] Regenerate baseline reports with current legacy exceptions recorded. +- [x] Add a test or fixture proving settings-level `useLegacyPresenter` fails the guard. +- [x] Define the per-slice verification matrix in + [verification.md](./verification.md).
+ +Side effect: + +- CI may begin failing until the baseline/bridge register is updated. Treat that as intentional + visibility, not a migration failure. + +Evidence: + +- `node scripts/architecture-guard.mjs` passed after the guard began scanning + `src/renderer/settings` and after `src/renderer/api/legacy/**` was deleted. +- Source scan: `rg "@api/legacy|legacy/presenters|legacy/runtime" src -g '*.ts' -g '*.vue' -g '*.d.ts'` + returns no hits. +- `node scripts/generate-architecture-baseline.mjs` regenerated + `docs/architecture/baselines/main-kernel-boundary-baseline.md` and + `docs/architecture/baselines/main-kernel-migration-scoreboard.*` with `renderer.*` legacy counts + at `0`. +- Evidence: `pnpm exec vitest run test/main/scripts/architectureGuard.test.ts --silent --reporter=dot` + passed with 1 file / 2 tests. + +## T2 - Easy Replacements Using Existing Clients + +- [x] Replace `filePresenter.getMimeType/prepareFile` with `FileClient`. +- [x] Replace `toolPresenter.getAllToolDefinitions` with `ToolClient`. +- [x] Replace `projectPresenter.getRecentProjects/selectDirectory` with `ProjectClient`. +- [x] Replace `devicePresenter.getAppVersion/getDeviceInfo/selectDirectory` with `DeviceClient`. +- [x] Replace `agentSessionPresenter.getAgents` with `SessionClient.getAgents` or + `ConfigClient.listAgents`. +- [x] Replace direct `window.api.copyText/readClipboardText/openExternal/getPathForFile` with + existing runtime wrapper methods through `DeviceClient`, `BrowserClient`, or `FileClient`. +- [x] Remove unused legacy `windowPresenter`/`configPresenter` injections where no method is needed. + +Automated tests: + +- Renderer component tests for prompt editor, DeepChat agent settings, remote settings path picker, + About settings, and data settings. +- `node scripts/architecture-guard.mjs`. + +Manual tests: + +- File picker, prompt file import, and remote default workdir selection. 
+ +Project/environment evidence: + +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/21-project-readonly-route.smoke.spec.ts` + passed with 1 smoke test. It opens the real Environments Settings page and reads + `project.listRecent`, `project.listEnvironments`, and `project.pathExists` for both an existing + repository path and a generated missing path without opening directories or invoking the native + directory picker. +- Focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/21-project-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Manual follow-up remains required for native directory picker, open-directory behavior, and + remote/default-workdir flows because those depend on OS dialogs and shell integration. + +Agent session evidence: + +- Added `sessions.getUsageDashboard` and `sessions.retryRtkHealthCheck`. +- Replaced Dashboard usage and Remote settings agent list with `SessionClient`. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/DashboardSettings.test.ts test/renderer/components/RemoteSettings.test.ts` + passed with 5 files / 84 tests. +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/15-dashboard-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real Settings Overview dashboard surface and verifies the + typed `sessions.getUsageDashboard` route shape without triggering `sessions.retryRtkHealthCheck` + or mutating session data. + +## T3 - Typed Events Before Heavy Route Work + +- [x] Remove legacy stream terminal fallback in `messageIpc.ts` or add the missing typed refresh event. 
+- [x] Migrate context-menu raw channels to a typed event or narrow preload API. +- [x] Migrate settings navigation/provider-install/notification raw events. +- [x] Migrate `CONFIG_EVENTS.AGENTS_CHANGED`, `RAG_EVENTS.*`, `RATE_LIMIT_EVENTS.*`, + `SKILL_SYNC_EVENTS.*`, `ACP_DEBUG_EVENTS.EVENT`, and `skill:*` listeners. +- [x] Migrate ACP terminal/init raw channels to typed routes/events. +- [x] Remove legacy dialog request and workspace invalidation raw renderer events after typed + events had consumers. +- [x] Remove legacy device reset completion raw notification after typed app-runtime event had a + consumer. +- [x] Remove legacy system notification click raw notification after typed app-runtime event had a + consumer. +- [x] Remove legacy Ollama pull-progress raw event after typed provider event had a consumer. +- [x] Remove legacy skill catalog/session raw events after typed skill events had consumers. +- [x] Remove legacy YoBrowser raw lifecycle/open events after typed browser events had consumers. +- [x] Remove legacy MCP sampling raw events after typed MCP sampling events had consumers. +- [x] Remove legacy config font-size raw event after typed settings changed event had a consumer. +- [x] Remove legacy NowledgeMem config raw event after typed config routes had consumers. +- [x] Remove legacy MCP config renderer send while keeping main-internal MCP config event and typed + bridge. +- [x] Remove legacy ACP workspace raw events after typed session ACP ready events had consumers. + +Automated tests: + +- `test/renderer/api/createBridge.test.ts`. +- New event contract tests. +- Affected store/component tests. + +Manual tests: + +- Send a chat message and ensure terminal refresh is stable. +- Use selected text context menu for translate and ask-AI. +- Open settings via deeplink/provider install. +- ACP terminal initialization/input/kill and external dependency prompt. 
+ +Settings/window/notification/ACP evidence: + +- Added typed events for settings navigation, provider install, update check, notification error, + database repair suggestion, and ACP terminal lifecycle/output/dependency events. +- Added `window.notifySettingsReady`, `acpTerminal.input`, and `acpTerminal.kill` routes. +- Replaced settings shell, About update check, ACP settings reload, Skills catalog reload, and ACP + terminal listeners with typed clients. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/SettingsApp.test.ts test/renderer/components/SettingsApp.providerDeeplink.test.ts test/renderer/components/AboutUsSettings.test.ts` + passed with 6 files / 92 tests. +- Additional evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/AcpSettings.test.ts` + passed with 4 files / 77 tests. +- Upgrade typed-event cleanup evidence: + `pnpm exec vitest run test/main/presenter/upgradePresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/AboutUsSettings.test.ts --silent --reporter=dot` + passed with 4 files / 64 tests. `upgradePresenter` no longer sends renderer-visible + `UPDATE_EVENTS.STATUS_CHANGED`, `PROGRESS`, `WILL_RESTART`, or `ERROR` raw channels; renderer + update state is delivered through typed `upgrade.status.changed`, `upgrade.progress`, + `upgrade.willRestart`, and `upgrade.error` events. `UPDATE_EVENTS.STATE_CHANGED` remains only as a + main-internal upgrade/lifecycle signal. 
+- Dialog typed-event cleanup evidence: + `pnpm exec vitest run test/main/presenter/dialogPresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/stores/dialogStore.test.ts --silent --reporter=dot` + passed with 5 files / 82 tests. `DialogPresenter.showDialog` now emits only typed + `dialog.requested`; retired `dialog:request` / `dialog:response` constants were removed from main + and renderer event files. Runtime stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts --workers=1` + passed with 2 smoke tests after rebuilding. +- Workspace invalidation cleanup evidence: + `pnpm exec vitest run test/main/presenter/workspacePresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts --silent --reporter=dot` + passed with 4 files / 94 tests. Workspace watchers now emit only typed `workspace.invalidated`; + retired `workspace:files-changed` invalidation constants were removed from main and renderer + event files. User-flow route evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts test/e2e/specs/29-workspace-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens the real main renderer, registers the + current repository as an allowed workspace, reads directory/search/git status routes, and + unregisters in `finally` without starting watchers, opening files, or revealing paths. +- Device reset completion cleanup evidence: + `pnpm exec vitest run test/main/presenter/devicePresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/DataSettings.test.ts --silent --reporter=dot` + passed with 5 files / 103 tests. 
`DevicePresenter` now publishes typed + `appRuntime.dataResetCompleteDev` directly in the development reset completion branch; the retired + `notification:data-reset-complete-dev` constant was removed from main and renderer event files, + and the `WindowPresenter` legacy-channel translation case was removed. Source scan: + `rg "DATA_RESET_COMPLETE_DEV|notification:data-reset-complete-dev" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens the real Data Settings page and reads + read-only device/database routes without triggering destructive data reset. The actual reset + button flow remains a disposable-profile manual check. +- System notification click cleanup evidence: + `pnpm exec vitest run test/main/presenter/notificationPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/App.startup.test.ts --silent --reporter=dot` + passed with 4 files / 67 tests. `NotificationPresenter` now publishes typed + `appRuntime.systemNotificationClicked` directly when an Electron system notification is clicked; + the retired `notification:sys-notify-clicked` translation case was removed from + `WindowPresenter`, and the old `NOTIFICATION_EVENTS` constants were removed from main and + renderer event files. Source scan: + `rg "NOTIFICATION_EVENTS|notification:sys-notify-clicked|SYS_NOTIFY_CLICKED" src/main src/renderer -g '*.ts' -g '*.vue'` + returns no hits. User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts --workers=1` + passed with 2 smoke tests after rebuilding. 
Actual OS notification display/click behavior remains + a platform manual check because it depends on notification permissions and desktop environment. +- Ollama pull-progress cleanup evidence: + `pnpm exec vitest run test/main/presenter/llmProviderPresenter/ollamaManager.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/stores/ollamaStore.test.ts --silent --reporter=dot` + passed with 4 files / 58 tests. `OllamaManager` now emits only typed + `providers.ollama.pull.progress`; the retired `ollama:pull-model-progress` constants were + removed from main and renderer event files. Source scan: + `rg "OLLAMA_EVENTS|ollama:pull-model-progress|PULL_MODEL_PROGRESS" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens the real Model Providers settings + surface without pulling a model or requiring a live Ollama daemon. +- Skill catalog/session cleanup evidence: + `pnpm exec vitest run test/main/presenter/skillPresenter/skillPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/McpIndicator.test.ts test/renderer/components/SkillsSettings.test.ts test/renderer/components/SkillEditorSheet.test.ts --silent --reporter=dot` + passed with 5 files / 151 tests. `SkillPresenter` now emits only typed + `skills.catalog.changed` and `skills.session.changed` for discovery, install/uninstall, + activation/deactivation, and watcher metadata changes; retired `skill:*` constants were removed + from main and renderer event files. 
Source scan: + `rg "SKILL_EVENTS|skill:activated|skill:deactivated|skill:discovered|skill:installed|skill:uninstalled|skill:metadata-updated" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/16-skills-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens the real Skills settings surface and + reads skill routes without installing, uninstalling, saving, or editing skill files. +- YoBrowser lifecycle/open cleanup evidence: + `pnpm exec vitest run test/main/presenter/YoBrowserPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/BrowserPanel.test.ts --silent --reporter=dot` + passed with 4 files / 71 tests. `YoBrowserPresenter` now emits only typed + `browser.status.changed`, `browser.open.requested`, and `browser.activity.changed`; retired + `yo-browser:*` constants were removed from main and renderer event files. The old + `yo-browser:window-count-changed` event had no business consumer and was retired without a typed + replacement. Source scan: + `rg "YO_BROWSER_EVENTS|yo-browser:" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow evidence: `test/e2e/specs/08-browser-route.smoke.spec.ts` passed in + the 3-spec run and validated browser typed routes. `01-launch` and `06-settings-ipc-boundary` + passed individually after the same build; a 3-spec rerun hit an app fixture setup timeout in + `06-settings-ipc-boundary`, which is recorded as existing e2e harness startup instability rather + than a browser route failure. 
+- MCP sampling cleanup evidence: + `pnpm exec vitest run test/main/presenter/mcpPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/stores/mcpSampling.test.ts --silent --reporter=dot` + passed with 4 files / 68 tests. `McpPresenter` no longer sends retired + `mcp:sampling-request`, `mcp:sampling-decision`, or `mcp:sampling-cancelled` raw renderer + channels; sampling approval, decision, and cancellation notifications are delivered through typed + `mcp.sampling.request`, `mcp.sampling.decision`, and `mcp.sampling.cancelled` events. Source scan: + `rg "mcp:sampling-request|mcp:sampling-decision|mcp:sampling-cancelled|SAMPLING_REQUEST|SAMPLING_DECISION|SAMPLING_CANCELLED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens the real MCP Settings page and verifies + typed MCP read-only routes, but it does not exercise a live MCP sampling request because that + requires a test MCP server and model invocation path. +- Config font-size cleanup evidence: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/main/routes/settingsHandler.test.ts test/renderer/api/clients.test.ts test/renderer/stores/uiSettingsStore.test.ts --silent --reporter=dot` + passed with 6 files / 88 tests. `ConfigPresenter.setSetting('fontSizeLevel', value)` now relies + on typed `settings.changed` only; retired `config:font-size-changed` constants were removed from + main and renderer event files. Source scan: + `rg "config:font-size-changed|FONT_SIZE_CHANGED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. 
User-flow stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. Actual font-size UI adjustment and cross-window class + synchronization remain manual or future dedicated e2e because the current config e2e is + read-only. +- NowledgeMem config cleanup evidence: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/NowledgeMemSettings.test.ts --silent --reporter=dot` + passed with 5 files / 83 tests. `ConfigPresenter.setNowledgeMemConfig` no longer sends retired + `config:nowledge-mem-config-updated`; NowledgeMem settings save/load behavior is carried by typed + `nowledgeMem.updateConfig` and `nowledgeMem.getConfig` routes. Source scan: + `rg "config:nowledge-mem-config-updated|NOWLEDGE_MEM_CONFIG_UPDATED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. User-flow evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. The e2e opens real Knowledge Settings, writes a + temporary NowledgeMem config through UI/typed routes, verifies persistence, and restores the + original config; live Test Connection remains manual because it requires a running NowledgeMem + service. +- MCP config bridge cleanup evidence: + `pnpm exec vitest run test/main/presenter/configPresenter/mcpConfHelper.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/stores/mcpStore.test.ts --silent --reporter=dot` + passed with 5 files / 89 tests. 
`McpConfHelper.batchImportMcpServers` no longer sends + `MCP_EVENTS.CONFIG_CHANGED` directly to renderer; it emits the main-internal MCP config event, + and `legacyTypedEventBridge` publishes typed `mcp.config.changed`. The unused renderer + `MCP_EVENTS` raw constants were removed. Source scan over the touched files confirms no + `eventBus.sendToRenderer` remains in `mcpConfHelper`. User-flow evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. Batch import from external marketplaces still needs + manual or opt-in e2e because it mutates MCP server config and can depend on network data. +- ACP workspace/debug cleanup evidence: + `pnpm exec vitest run test/main/presenter/acpProvider.test.ts test/main/presenter/llmProviderPresenter/acp/acpProcessManager.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/ChatStatusBar.test.ts test/renderer/components/AcpDebugDialog.test.ts --silent --reporter=dot` + passed with 6 files / 157 tests. ACP workspace readiness now uses typed + `sessions.acp.modes.ready`, `sessions.acp.commands.ready`, and + `sessions.acp.configOptions.ready`; retired `acp-workspace:*` constants were removed from main, + renderer, and tests. ACP debug events now enter the main event bus as `ACP_DEBUG_EVENTS.EVENT` + and are published to renderer through typed `providers.acp.debug.event` by the bridge. 
Source + scan: + `rg "ACP_WORKSPACE_EVENTS|acp-workspace:|SESSION_MODES_READY|SESSION_COMMANDS_READY|SESSION_CONFIG_OPTIONS_READY|eventBus\\.sendToRenderer\\(" src/main/presenter/llmProviderPresenter src/main/events.ts src/renderer/src/events.ts test/main/presenter/acpProvider.test.ts test/main/presenter/llmProviderPresenter/acp/acpProcessManager.test.ts test/renderer/components/ChatStatusBar.test.ts -g '*.ts' -g '*.vue'` + returns no hits. User-flow evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts --workers=1` + passed with 4 smoke tests after rebuilding. Real ACP process warmup, debug actions, mode/model + selection, and config option changes remain manual or opt-in e2e because they require runnable + ACP agents and local runtime dependencies. +- Runtime window-state evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts` + passed with 1 smoke test. It reads `window.getCurrentState` from both the real main renderer and + the real Settings renderer, proving the context-aware route returns distinct current-window state + snapshots without minimizing, maximizing, focusing, or closing either window. +- Focused window stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Runtime provider preview evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/25-window-provider-deeplink-preview.smoke.spec.ts --reporter=list` + passed with 1 smoke test. 
It queues a custom provider install preview through the typed + `window.requeuePendingSettingsProviderInstall` route, opens the real Settings window, verifies the + Provider settings preview dialog shows the provider name, base URL, and masked key, and confirms + `window.consumePendingSettingsProviderInstall` is empty afterward without clicking confirm or + applying provider configuration. +- Focused provider preview stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/25-window-provider-deeplink-preview.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. + +Context-menu/app-runtime/chat stream evidence: + +- Added typed app runtime and context-menu events. +- Replaced main-window deeplink/MCP install/shortcut/notification/context-menu sends with typed + event envelopes while preserving existing renderer UI behavior. +- Removed `messageIpc.ts` legacy `STREAM_EVENTS.END/ERROR` fallback. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/App.startup.test.ts test/renderer/components/SettingsApp.test.ts test/renderer/lib/storeInitializer.test.ts test/renderer/components/message/SelectedTextContextMenu.test.ts --silent --reporter=dot` + passed with 7 files / 102 tests. +- Additional final-slice evidence: `test/renderer/stores/messageStore.test.ts` passed in the final + focused migration gate, proving the store no longer depends on the removed legacy stream fallback. + +## T4 - Config, ACP, Agent, And Settings Route Gaps + +- [x] Add typed ACP config/registry/manual-agent routes and `ConfigClient` methods. +- [x] Add DeepChat agent CRUD routes. +- [x] Add hooks notifications routes. +- [x] Add proxy/update-channel/logging-folder routes. +- [x] Add provider DB refresh route in the best owning domain. 
+- [x] Replace `AcpSettings`, `DeepChatAgentsSettings`, `NotificationsHooksSettings`, + `AboutUsSettings`, proxy/logging/default-model/common settings sections. + +Automated tests: + +- Contract tests for new route schemas. +- Route handler tests with mocked `configPresenter`. +- Component tests for ACP and agent settings. + +Manual tests: + +- ACP install/repair/uninstall/manual-agent CRUD. +- DeepChat agent advanced editing: model selection, default project, tool toggles, subagent slots, + and auto-compaction controls. +- Proxy/update channel/logging folder. + +Config/ACP read-only evidence: + +- Added typed ACP config/registry/manual-agent/shared-MCP routes and `ConfigClient` methods. +- Replaced `AcpSettings` with typed `ConfigClient` calls. +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real ACP Settings page and reads + `config.getAcpState`, `config.listAcpRegistryAgents`, `config.listManualAcpAgents`, + `config.getAcpSharedMcpSelections`, and `config.listAgents` for DeepChat/ACP views without + toggling ACP, refreshing the registry, installing/repairing/uninstalling registry agents, or + mutating manual agents. +- Focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- Config settings read-only runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. 
It opens the real DeepChat Agents, Notifications Hooks, and Shortcuts + settings pages, then reads `config.listAgents`, `config.resolveDeepChatAgentConfig`, + `config.getAgentMcpSelections`, `config.getHooksNotifications`, and `config.getShortcutKeys` + without creating/updating/deleting agents, saving hooks, testing hook commands, resetting + shortcuts, or changing global shortcut registration. +- Config settings focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- Hooks notification command runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/27-hooks-notification-command.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It saves a temporary hook through `config.setHooksNotifications`, + verifies the real Notifications Hooks settings page renders it, runs a harmless local + `node -e` command through `config.testHookCommand`, checks the successful stdout/exit code, and + restores the original hooks config in `finally`. +- Hooks notification focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/27-hooks-notification-command.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- DeepChat agent CRUD runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/26-deepchat-agent-crud.smoke.spec.ts --reporter=list` + passed with 1 smoke test after rebuilding the app. 
It opens the real DeepChat Agents settings + page, creates a uniquely named temporary agent through the UI, verifies it through + `config.listAgents`, updates its name/description through the UI, deletes it through + `config.deleteDeepChatAgent`, and performs best-effort cleanup in `finally`. +- DeepChat agent CRUD focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/26-deepchat-agent-crud.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- Config system read-only runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real About settings page, then reads + `config.getProxySettings`, `config.getUpdateChannel`, `config.getSyncSettings`, + `config.getSkillDraftSuggestions`, `config.getEntries` for model/default file-size settings, and + `upgrade.getStatus` without opening the General proxy section, changing proxy mode, checking for + updates, downloading updates, opening the logging folder, refreshing the provider database, or + changing the update channel. +- Config system focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- Manual follow-up remains required for ACP install/repair/uninstall, manual-agent CRUD, and + external dependency terminal interaction because those write runtime directories or start + subprocess flows. DeepChat agent advanced editing paths, such as model selection, default project + path, tool toggles, subagent slots, and auto-compaction controls, remain manual or future + disposable-profile checks. 
Custom hook scripts/failure scenarios and real event dispatch remain + manual or future opt-in checks because user commands can touch local files or external services. + Shortcut Settings UI edit/clear/reset and OS-level global shortcut activation remain + manual/disposable-profile checks because they mutate user settings and depend on platform global + shortcut registration state. + Proxy/update-channel saves, logging-folder opening, and provider DB refresh also remain manual or + opt-in checks because they write configuration, invoke OS shell behavior, or touch network-backed + provider metadata. + +## T5 - Provider, Model, OAuth, And ACP Debug + +- [x] Add provider key status and rate-limit update routes. +- [x] Add embedding dimensions route or extend model capabilities route. +- [x] Add ModelScope MCP sync route. +- [x] Add ACP debug action route and typed debug event. +- [x] Add GitHub Copilot OAuth routes. +- [x] Replace `ProviderApiConfig`, `BuiltinKnowledgeSettings`, `ModelScopeMcpSync`, + `ProviderRateLimitConfig`, `AcpDebugDialog`. +- [x] Replace `GitHubCopilotOAuth`. + +Automated tests: + +- Provider/model route handler tests with mocked provider runtime. +- Renderer API and component tests. +- OAuth evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/GitHubCopilotOAuth.test.ts` + passed with 4 files / 57 tests. +- Provider read-only runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts` + passed with 1 smoke test. 
It opens the real Model Providers settings page, waits for provider + rows, and reads `providers.listSummaries`, `providers.listDefaults`, `providers.listModels`, and + `providers.getRateLimitStatus` without saving provider settings, refreshing models, testing live + connectivity, running OAuth, syncing ModelScope MCP servers, or starting ACP debug actions. +- Focused provider stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. + +Manual tests: + +- Refresh models, update provider rate limit, run ACP debug, live provider connection checks, and + provider key-status reads that depend on real credentials/network state. +- GitHub Copilot auth: in Settings -> Provider -> GitHub Copilot, run device flow and traditional + OAuth against a real GitHub account, then verify the provider shows connected and model + verification can use the saved token. This is not fully automatable because it depends on an + external browser/device-code consent flow. + +## T6 - Knowledge Routes And Events + +- [x] Add `knowledge.*` routes and `KnowledgeClient`. +- [x] Add typed `knowledge.file.updated/progress` events. +- [x] Replace `KnowledgeBaseSettings`, `KnowledgeFile`, `KnowledgeFileItem`, + `BuiltinKnowledgeSettings` knowledge calls. + +Automated tests: + +- Route contract and handler tests. +- Knowledge settings component tests. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/BuiltinKnowledgeSettings.test.ts test/renderer/components/KnowledgeFile.test.ts test/renderer/components/KnowledgeFileItem.test.ts` + passed with 6 files / 54 tests. 
+- E2E read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/12-knowledge-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real Knowledge Settings page and reads + `knowledge.isSupported`, `knowledge.getSupportedLanguages`, + `knowledge.getSeparatorsForLanguage`, and `knowledge.getSupportedFileExtensions` without adding + files, running ingestion, or mutating knowledge-base data. + +Manual tests: + +- Add/delete/re-add a file, pause/resume ingestion, run similarity query. + +## T7 - Skill Sync Routes And Events + +- [x] Add `skillSync.*` routes and `SkillSyncClient`. +- [x] Add typed discovery/scan/import/export events. +- [x] Replace sync prompt/status/import/export components. + +Automated tests: + +- Contract tests for import/export input. +- Handler tests with mocked scanner/converter. +- Wizard component tests. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/SkillSyncSettings.test.ts` + passed with 4 files / 53 tests. +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts` + passed with 1 smoke test after rebuilding the app. It opens the real Skills settings page, verifies + the sync status surface is present, reads `skillSync.getRegisteredTools`, + `skillSync.getNewDiscoveries`, and `skillSync.scanExternalTools`, and confirms the typed + `skillSync.scan.started/completed` events are delivered. It does not acknowledge discoveries or + preview/execute import/export. +- Focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. 
+ +Manual tests: + +- Import skills, export skills, and resolve conflicts against real external tool directories. + +## T8 - Remote Control Routes + +- [x] Add `remoteControl.*` routes and `RemoteControlClient`. +- [x] Replace `RemoteControlRuntime.ts` and `RemoteSettings.vue`. +- [x] Remove `remoteControlPresenter:call` after no consumers remain. + +Automated tests: + +- Route schema/handler tests for all channels. +- Remote settings component tests. + +Manual tests: + +- Telegram pair/bind/unbind. +- Feishu/QQBot/Discord status and settings. +- Weixin iLink login/restart/remove. + +Evidence: + +- Added typed routes for channel list/settings/status/bindings/pairing and Weixin iLink account + operations. +- Replaced `RemoteControlRuntime`, `RemoteSettings`, and the main-window `WindowSideBar` remote + status polling with `RemoteControlClient`; `src/renderer/api/RemoteControlRuntime.ts` has been + deleted. +- Evidence: + `pnpm exec vitest run test/renderer/components/WindowSideBar.test.ts test/renderer/components/RemoteSettings.test.ts test/renderer/api/clients.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts --silent --reporter=dot` + passed with 5 files / 126 tests. +- Main-window runtime evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts test/e2e/specs/11-remote-control-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests. The main renderer IPC boundary smoke now reads + `remoteControl.listChannels` and `remoteControl.getChannelStatus` from the real main chat + renderer, covering the same typed route family used by `WindowSideBar` without mutating remote + control settings. +- Manual follow-up: exercise Telegram pairing and Weixin iLink login against real services. Unit + tests validate route wiring and component state only. 
+- Final transport evidence: source scans for `RemoteControlRuntime`, `createRemoteControlRuntime`, + and `remoteControlPresenter:call` return no hits in `src/main`, `src/renderer`, `src/preload`, or + renderer tests. + +## T9 - Remaining Operational Domains + +- [x] Add `skills.readFile` route and replace skill editor. +- [x] Add MCP Router market routes and replace `McpBuiltinMarket`. +- [x] Add NowledgeMem routes and replace `NowledgeMemSettings`. +- [x] Add database repair route and replace `sqlitePresenter.repairSchema`. +- [x] Add browser sandbox clear route and replace `yoBrowserPresenter.clearSandboxData`. +- [x] Decide whether renderer shortcut registration should be removed or typed. + +Automated tests: + +- Focused route handler/client/component tests. + +Manual tests: + +- Skill editor read/save. +- MCP Router API key/list/install. +- NowledgeMem config/test. +- Database repair on copied profile. +- Browser sandbox clear. +- Global shortcut enable/disable behavior. + +MCP Router evidence: + +- Added MCP Router API key/list/install/auth routes and `McpClient` methods. +- Replaced `McpBuiltinMarket` with typed client calls. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/McpBuiltinMarket.test.ts` + passed with 4 files / 70 tests. +- MCP read-only runtime evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real MCP Settings page and reads `mcp.getEnabled`, + `mcp.getServers`, `mcp.getClients`, `mcp.listToolDefinitions`, `mcp.listPrompts`, + `mcp.listResources`, and `mcp.getNpmRegistryStatus` without toggling MCP, refreshing registry + metadata, installing marketplace servers, or starting/stopping MCP servers. 
+- Manual follow-up: save a real MCP Router API key, list marketplace servers, install one server, + and verify it appears in MCP settings. This depends on network and live credentials. + +Shortcut evidence: + +- Added `shortcut.register`, `shortcut.unregister`, and `shortcut.destroy` routes. +- Replaced `ShortcutRuntime` legacy presenter dependency with `ShortcutClient`; the renderer + shortcut store imports `ShortcutClient` directly and `src/renderer/api/ShortcutRuntime.ts` has + been deleted. +- Moved `config.shortcutKeys.changed` publishing into `ConfigPresenter.setShortcutKey` and + `ConfigPresenter.resetShortcutKeys`; `legacyTypedEventBridge` no longer monkey patches + `configPresenter` shortcut methods. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/AcpSettings.test.ts` + passed with 4 files / 81 tests after the direct shortcut event publish cleanup. +- Runtime route/event evidence: + `pnpm exec playwright test test/e2e/specs/28-shortcut-route-restore.smoke.spec.ts` passed with 1 + smoke test. It opens the real Settings Shortcuts page, writes a temporary `QuickSearch` shortcut + through the typed `config.setShortcutKeys` route from the Settings renderer, verifies + `config.shortcutKeys.changed`, calls `shortcut.destroy`, `shortcut.register`, and + `shortcut.unregister`, and restores the original shortcut config in `finally`. +- Focused shortcut stability evidence: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/28-shortcut-route-restore.smoke.spec.ts --workers=1` + passed with 3 smoke tests before and after removing the shortcut monkey patch from the legacy + typed event bridge. The `--workers=1` flag is required for combined Electron specs because the app + enforces a single-instance `SingletonLock`. 
+- Manual follow-up: use the real Shortcut Settings UI to edit, clear, reset, and save shortcuts; + focus/blur the app; press the configured OS global shortcut; and confirm duplicate registration or + accelerator conflicts are handled on the target OS. The automated route smoke proves IPC reachability + and restoration, not the platform global-shortcut side effect. + +Data settings evidence: + +- Added `databaseSecurity.repairSchema` and `browser.clearSandboxData`. +- Replaced Data Settings repair/sandbox actions with `DatabaseSecurityClient` and `BrowserClient`. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/DataSettings.test.ts` + passed with 4 files / 80 tests. +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts` + passed with 1 smoke test after rebuilding the app. It opens the real Data Settings page, verifies + the database encryption, database repair, and YoBrowser sandbox surfaces are visible, then reads + `databaseSecurity.getStatus`, `device.getInfo`, and `device.getAppVersion` without enabling + encryption, changing passwords, repairing schema, resetting data, or clearing browser sandbox + data. +- Focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Manual follow-up: enable/change/disable database encryption in a disposable encrypted profile, run + database repair against a copied real profile, reset each data type in a disposable profile, and + clear YoBrowser sandbox, then confirm browser state/cookies are reset. These require local + profile/browser state and are not fully automatable in unit tests. 
+ +NowledgeMem evidence: + +- Added `nowledgeMem.getConfig`, `nowledgeMem.updateConfig`, and + `nowledgeMem.testConnection`. +- Replaced `NowledgeMemSettings` with `NowledgeMemClient`. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/NowledgeMemSettings.test.ts` + passed with 4 files / 64 tests. +- Runtime UI evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real Knowledge Settings page, expands the NowledgeMem + panel, saves a temporary base URL/API key through the UI, verifies + `nowledgeMem.getConfig/updateConfig`, and restores the original config in `finally`. +- Manual follow-up: configure a real NowledgeMem endpoint/API key and run Test Connection. This + depends on a running external service, so automated tests only validate routing, config + persistence, restore behavior, and component state. + +Skill editor evidence: + +- Added `skills.readFile` and `SkillClient.readSkillFile`. +- Replaced `SkillEditorSheet` file loading with `SkillClient`. +- Evidence: `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/SkillEditorSheet.test.ts` + passed with 4 files / 67 tests. +- Runtime read-only evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/16-skills-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. It opens the real Skills Settings page, reads + `skills.getDirectory` and `skills.listMetadata`, and, when an installed skill exists, reads + `skills.readFile`, `skills.getFolderTree`, `skills.getExtension`, and `skills.listScripts` + without installing, uninstalling, or saving skill files. 
+- Focused stability evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/16-skills-readonly-route.smoke.spec.ts --reporter=list` + passed with 3 smoke tests after tightening main-window detection so floating/settings/splash + windows are not treated as the main chat window. +- Manual follow-up: open an installed skill, edit/save/reopen it, and verify script/runtime + settings persist. Unit tests validate loading and IPC routing only. + +## T10 - Secondary Renderer Hardening + +- [x] Replace splash `exposeElectronAPI()` usage with dedicated typed splash API. +- [x] Add payload validation to browser overlay activity API or move it to `createBridge`. +- [x] Move floating widget channel constants to shared contracts and validate payloads. +- [x] Keep plugin settings as typed-route backed specialized API; add tests if missing. + +Automated tests: + +- Preload bridge tests for splash/floating/browser overlay APIs. +- Existing floating presenter tests. + +Manual tests: + +- Splash database unlock. +- Floating widget drag/open session/language/theme. +- Browser overlay activity display. +- Plugin settings enable/disable/action invocation. + +Evidence: + +- Splash renderer now uses `window.deepchatSplash`; raw splash IPC remains only inside + `src/preload/splash-preload.ts`. The preload boundary test verifies that the exposed API is + limited to splash update/unlock methods, uses scoped `database-security:*` channels, returns + unsubscribe functions, and drops invalid submit/cancel payloads. +- Floating widget now uses shared `FLOATING_BUTTON_EVENTS`, validates renderer-to-main payloads, + validates main-to-renderer events, and returns scoped unsubscribe functions instead of exposing + `removeAllListeners`. +- Browser overlay validates `browser.activity.changed` with the shared event schema before invoking + renderer callbacks. 
+- Plugin settings preload is covered by `test/renderer/api/preloadBoundaries.test.ts`, which verifies + `window.deepchatPlugin` calls typed plugin routes through `createBridge`. +- Floating button and floating chat windows now load the dev renderer only when + `ELECTRON_RENDERER_URL` is present; built/e2e mode falls back to bundled renderer files instead of + `http://localhost:5173/*`. +- Evidence: `pnpm exec vitest run test/renderer/api/preloadBoundaries.test.ts test/main/presenter/floatingButtonPresenter/index.test.ts test/renderer/components/BrowserActivityOverlay.test.ts test/renderer/api/clients.test.ts test/main/routes/contracts.test.ts test/main/scripts/architectureGuard.test.ts --silent --reporter=dot` + passed before the latest splash boundary addition with 6 files / 68 tests. The full focused gate + below includes the new splash boundary case. +- User-flow evidence: `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/04-settings-navigation.smoke.spec.ts --reporter=list` + passed with 2 tests, covering Electron launch and settings control-center navigation. +- Additional user-flow evidence: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts --reporter=list` + passed with 1 test, covering the real settings window typed bridge, legacy + `presenter:call` rejection, and migrated knowledge/skills/remote/MCP/data settings surfaces. + +## T11 - Retire Legacy Transport + +- [x] Verify no renderer business imports `@api/legacy/presenters` or `@api/legacy/runtime`. +- [x] Delete or empty `RemoteControlRuntime.ts` and `ShortcutRuntime.ts` legacy dependencies. +- [x] Remove `presenter:call` and `remoteControlPresenter:call` handlers. +- [x] Remove `Presenter.DISPATCHABLE_PRESENTERS` and `Presenter.REMOTE_CONTROL_METHODS` if unused. +- [x] Delete `src/renderer/api/legacy/**` once there are no consumers. 
+- [x] Update `docs/ARCHITECTURE.md`, `docs/FLOWS.md`, `docs/guides/code-navigation.md`, and baseline + reports to reflect the real final state. + +Final automated gate: + +```bash +rg "useLegacyPresenter|useLegacyRemoteControlPresenter|useLegacyShortcutPresenter" src/renderer +rg "window\\.electron|window\\.api" src/renderer +node scripts/architecture-guard.mjs +pnpm run format +pnpm run i18n +pnpm run lint +pnpm run typecheck +pnpm test +``` + +Current scan evidence: + +- `rg "window\\.electron(\\?|\\.)\\.ipcRenderer|useLegacyPresenter|useLegacyRemoteControlPresenter|useLegacyShortcutPresenter|legacy/presenters" src/renderer src/main src/preload` + shows raw IPC only inside preload/bridge internals and no source legacy presenter bridge. +- `rg "presenter:call|remoteControlPresenter:call|DISPATCHABLE_PRESENTERS|REMOTE_CONTROL_METHODS|src/renderer/api/legacy" src/main src/renderer src/preload -g '*.ts' -g '*.vue' -g '*.d.ts'` + returns no hits. +- `rg "UPDATE_EVENTS\\.(STATUS_CHANGED|PROGRESS|WILL_RESTART|ERROR)|update:status-changed|update:error|update:progress|update:will-restart" src test -g '*.ts' -g '*.vue'` + returns no hits. `UPDATE_EVENTS` now only exposes `STATE_CHANGED`, which is used inside main by + `upgradePresenter` and `lifecyclePresenter`. +- `rg "DIALOG_EVENTS|dialog:request|dialog:response|eventBus\\.sendToRenderer\\(DIALOG_EVENTS" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits; dialog requests now use the typed deepchat event channel and respond/error routes. +- `rg "WORKSPACE_EVENTS\\.INVALIDATED|workspace:files-changed|eventBus\\.sendToRenderer\\(WORKSPACE_EVENTS" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits; workspace invalidation now uses typed `workspace.invalidated`. The remaining + `WORKSPACE_EVENTS.INSERT_REFERENCE_REQUESTED` is a renderer-local DOM event, not main IPC. 
+- `rg "originalSetShortcutKey|originalResetShortcutKeys|configPresenter\\.setShortcutKey|configPresenter\\.resetShortcutKeys" src/main/routes/legacyTypedEventBridge.ts` + returns no hits; shortcut typed event publishing now lives with the owning config presenter. +- Renderer test harness cleanup: `rg "@api/legacy|useLegacyPresenter|legacy/runtime" test/renderer test/main -n` + now reports only the intentional failing fixture in `test/main/scripts/architectureGuard.test.ts`. + Migrated component/store tests mock typed clients instead of recreating virtual legacy modules. +- `pnpm exec vitest run test/renderer/api/preloadBoundaries.test.ts test/main/presenter/floatingButtonPresenter/index.test.ts test/renderer/components/BrowserActivityOverlay.test.ts test/renderer/api/clients.test.ts test/main/routes/contracts.test.ts test/main/scripts/architectureGuard.test.ts test/main/presenter/toolPresenter/agentTools/chatSettingsTools.test.ts test/main/presenter/deeplinkPresenter.test.ts test/main/presenter/presenterCallErrorHandler.test.ts test/main/presenter/skillSyncPresenter/index.test.ts test/main/presenter/lifecyclePresenter/SplashWindowManager.display.test.ts test/renderer/components/AcpDebugDialog.test.ts test/renderer/stores/messageStore.test.ts --silent --reporter=dot` + passed with 13 files / 130 tests after adding the splash preload boundary case. +- `pnpm run format`, `pnpm run i18n`, `pnpm run lint`, `pnpm run typecheck`, and `pnpm run build` + passed in the full migration gate. During the later RemoteControlRuntime cleanup, + `pnpm run typecheck` passed and `pnpm exec electron-vite build` passed after a duplicate + `pnpm run build` typecheck sub-process hung in `vue-tsgo`; the hung build process was stopped + before rerunning the bundler directly. 
+- Later upgrade raw-event cleanup evidence: `pnpm run typecheck` and `pnpm exec electron-vite build` + passed; `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests. +- Latest cleanup gate after the upgrade raw-event and shortcut bridge cleanup slices: + `pnpm run format`, `pnpm run i18n`, `pnpm run lint`, and `pnpm run typecheck` passed. Targeted + scans for legacy presenter imports, retired presenter channels, `RemoteControlRuntime`, + `ShortcutRuntime`, old renderer update raw events, and shortcut bridge monkey patching returned no + hits. +- Full `pnpm test -- --silent --reporter=dot` passed after project-level Vitest worker concurrency + was capped at `maxWorkers: 2`: 376 files passed, 6 skipped; 3175 tests passed, 41 skipped. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/04-settings-navigation.smoke.spec.ts --reporter=list` + passed with 2 smoke tests. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test evaluates the real settings renderer window and proves + `window.deepchat.invoke/on` are present, broad `window.electron` / `api.ipcRenderer` are absent, + and `window.deepchat.invoke('presenter:call', {})` is rejected as an unknown route. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts --reporter=list` + passed with 1 smoke test. 
The test evaluates the real main chat renderer window, calls the typed + `device.getAppVersion`, `remoteControl.listChannels`, and `remoteControl.getChannelStatus` + routes, proves `window.deepchat.invoke/on` are present, verifies broad `window.electron` / + `api.ipcRenderer` are absent, and confirms `presenter:call` is rejected as an unknown route. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/10-settings-privacy-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Data Settings page, toggles Privacy Mode through + the UI, verifies the typed `settings.getSnapshot/settings.update` route state, and restores the + original `privacyModeEnabled` value. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/11-remote-control-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Remote Settings page, verifies visible channel + tabs for Telegram, Feishu, QQBot, Discord, and Weixin iLink, and reads + `remoteControl.listChannels`, `remoteControl.getChannelSettings`, + `remoteControl.getChannelStatus`, and `remoteControl.getChannelBindings` for each channel without + live remote accounts or config mutation. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/12-knowledge-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Knowledge Settings page and verifies + read-only knowledge support, language, separator, and file-extension routes. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real MCP Settings page and verifies read-only MCP + server/client/tool/prompt/resource and NPM registry-status routes. 
+- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Knowledge Settings page, saves a temporary + NowledgeMem config through UI controls, verifies the typed config routes, and restores the + original config. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/15-dashboard-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Settings Overview dashboard and verifies + `sessions.getUsageDashboard` summary, calendar, provider/model breakdown, and RTK snapshot shape + without triggering RTK retry. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/16-skills-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real Skills Settings page and verifies read-only + skill directory, metadata, file, folder tree, extension, and script routes when installed skill + data is available. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test. The test opens the real ACP Settings page and verifies read-only ACP + state, registry-agent, manual-agent, shared-MCP, and DeepChat/ACP agent list routes. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts` + passed with 1 smoke test. The test opens the real Model Providers settings page and verifies + read-only provider summary/default/model catalog and rate-limit status routes without provider + mutation or live external actions. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts` + passed with 1 smoke test after rebuilding the app. 
The test opens the real Skills Settings page, + verifies SkillSync read-only routes, and confirms typed scan started/completed events. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts` + passed with 1 smoke test after rebuilding the app. The test opens the real Data Settings page and + verifies database-security/device read-only routes plus visible repair/sandbox surfaces without + running destructive actions. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/21-project-readonly-route.smoke.spec.ts` + passed with 1 smoke test. The test opens the real Environments Settings page and verifies + project recent/environments/path-existence routes without opening native dialogs. +- `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts` + passed with 1 smoke test. The test reads current window state from the real main and Settings + renderers without changing window state. +- Focused ACP stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts --reporter=list` + passed with 3 smoke tests. +- Focused Provider stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Focused SkillSync stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. 
+- Focused Data Security stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Focused Device reset notification cleanup gate: + `pnpm exec vitest run test/main/presenter/devicePresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/DataSettings.test.ts --silent --reporter=dot` + passed with 5 files / 103 tests, and + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after `pnpm exec electron-vite build`. +- Focused system notification click cleanup gate: + `pnpm exec vitest run test/main/presenter/notificationPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/App.startup.test.ts --silent --reporter=dot` + passed with 4 files / 67 tests, and + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts --workers=1` + passed with 2 smoke tests after `pnpm exec electron-vite build`. +- Focused Ollama pull-progress cleanup gate: + `pnpm exec vitest run test/main/presenter/llmProviderPresenter/ollamaManager.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/stores/ollamaStore.test.ts --silent --reporter=dot` + passed with 4 files / 58 tests, and + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after `pnpm exec electron-vite build`. 
+- Focused Skill catalog/session cleanup gate: + `pnpm exec vitest run test/main/presenter/skillPresenter/skillPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/McpIndicator.test.ts test/renderer/components/SkillsSettings.test.ts test/renderer/components/SkillEditorSheet.test.ts --silent --reporter=dot` + passed with 6 files / 151 tests, and + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/16-skills-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after `pnpm exec electron-vite build`. +- Focused YoBrowser cleanup gate: + `pnpm exec vitest run test/main/presenter/YoBrowserPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/BrowserPanel.test.ts --silent --reporter=dot` + passed with 4 files / 71 tests. `test/e2e/specs/08-browser-route.smoke.spec.ts` passed as part + of the focused run after `pnpm exec electron-vite build`; `01-launch` and + `06-settings-ipc-boundary` passed when rerun individually after the combined run hit an app + fixture setup timeout. +- Focused Project stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/21-project-readonly-route.smoke.spec.ts` + passed with 3 smoke tests. +- Focused Window stability gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts` + passed with 3 smoke tests.
+- Combined stable user-flow gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/04-settings-navigation.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts test/e2e/specs/08-browser-route.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts test/e2e/specs/10-settings-privacy-route.smoke.spec.ts test/e2e/specs/11-remote-control-readonly-route.smoke.spec.ts test/e2e/specs/12-knowledge-readonly-route.smoke.spec.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts test/e2e/specs/15-dashboard-readonly-route.smoke.spec.ts --reporter=list` + passed with 12 smoke tests after the e2e launcher main-window wait was increased to 60 seconds to + avoid false cold-start failures in long sequential smoke runs. +- Candidate 13-smoke expansion including `16-skills-readonly-route.smoke.spec.ts` was run but is + not promoted to stable yet: `01-launch` and `08-browser-route` hit Electron app setup timeouts in + the long sequential run, while the same two specs passed when rerun individually and the focused + `01 + 06 + 16` gate passed. This is tracked as e2e harness stability, not a skill route failure. +- Floating user-flow gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts --reporter=list` + passed with 1 smoke test after verifying the real floating renderer window loads from bundled + files in built/e2e mode, exposes only `floatingButtonAPI`, returns a valid widget snapshot, and + does not expose broad `window.electron`, `window.deepchat`, or `api.ipcRenderer`. 
+- Browser route user-flow gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/08-browser-route.smoke.spec.ts --reporter=list` + passed with 1 smoke test after loading a local `data:` page through `browser.loadUrl`, polling + `browser.getStatus` until ready, receiving typed `browser.status.changed` events, and destroying + the session browser. This deliberately avoids destructive sandbox clearing in the real profile. +- Upper-level docs now describe `src/renderer/api/legacy/**` as retired/deleted instead of an active + quarantine. `docs/FLOWS.md` already describes the current typed chat stream and had no active + legacy transport references. +- Focused Session/Conversation/Stream runtime cleanup: + `AgentSessionPresenter` no longer double-sends old `session:*` renderer events; `AgentRuntimePresenter`, + `dispatch`, `echo`, and `PendingInputCoordinator` publish `chat.stream.*`, + `sessions.status.changed`, `sessions.pendingInputs.changed`, and the new + `sessions.compaction.changed` typed event only; legacy `sessionPresenter` conversation/tab/message + managers no longer broadcast unused `conversation:*` renderer channels; and + `LifecycleManager.notifyMessage` no longer exposes a dynamic raw renderer escape hatch. +- Source scan now shows `eventBus.sendToRenderer` in runtime code only at + `src/main/routes/publishDeepchatEvent.ts`, the typed event publisher. Source scans for old + `conversation:*`, `stream:*`, and `session:*` renderer channel strings under `src/main` and + `src/renderer` are clean. 
+- Focused session/runtime verification: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/presenter/agentSessionPresenter/agentSessionPresenter.test.ts test/main/presenter/agentRuntimePresenter/echo.test.ts test/main/presenter/agentRuntimePresenter/pendingInputCoordinator.test.ts test/main/presenter/agentRuntimePresenter/dispatch.test.ts test/main/presenter/agentRuntimePresenter/process.test.ts test/main/presenter/agentRuntimePresenter/agentRuntimePresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts --silent --reporter=dot` + passed with 9 files / 339 tests before the final repository-wide format/lint/typecheck/build/e2e + gate. +- Final session/runtime cleanup gate passed: + `pnpm run format`, `pnpm run i18n`, `pnpm run lint`, `pnpm run typecheck`, and + `pnpm exec electron-vite build` all passed. Electron e2e `01-launch`, `09-main-ipc-boundary`, + and `23-config-readonly-route` passed in the first focused run; `06-settings-ipc-boundary` hit an + Electron app fixture setup timeout in that four-spec run, then passed when rerun alone, and + `01-launch + 09-main-ipc-boundary` passed together with `--workers=1`. + +## T16 - Final Presenter Event Sweep + +- [x] Remove the remaining broad `eventBus.send(...)` usage from main/renderer source. +- [x] Delete `legacyTypedEventBridge` after every migrated publisher emits typed events directly. +- [x] Replace the last `sendToRenderer` runtime usage with `publishDeepchatEvent` only. +- [x] Remove dead window/tab renderer broadcasts with no consumer: + `system-theme-updated`, `window:maximized`, `window:unmaximized`, + `window:enter-full-screen`, `window:leave-full-screen`, `setActiveTab`, + `update-window-tabs`, and `tab:title-updated`. 
+- [x] Keep only explicit secondary-window/private preload protocols: + floating button `FLOATING_BUTTON_EVENTS.*`, splash/database-unlock startup channels, + browser overlay activity, and ACP terminal envelopes sent to a concrete settings webContents. + +Evidence: + +- `rg "eventBus\\.send\\(" src/main src/renderer -g "*.ts" -g "*.vue"` is clean. +- `rg "legacyTypedEventBridge|setupLegacyTypedEventBridge" src/main test/main -g "*.ts"` is clean. +- `rg "setActiveTab|update-window-tabs|tab:title-updated|TITLE_UPDATED" src test -g "*.ts" -g "*.vue"` + is clean after removing the dead tab IPC constants and sends. +- `rg "WINDOW_EVENTS|SYSTEM_EVENTS" src/renderer/src/events.ts src/renderer test/renderer -g "*.ts" -g "*.vue"` + is clean after removing the renderer-side dead window/system event constants. Main-process + `WINDOW_EVENTS.*` remain only as EventBus-internal presenter coordination for BrowserView bounds. +- `rg "webContents\\.send\\(" src/main/presenter -g "*.ts"` now reports only the private-window + allowlist above, plus ACP terminal typed envelopes. +- Focused boundary gate: + `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/api/preloadBoundaries.test.ts --silent --reporter=dot` + passed with 4 files / 84 tests. +- Focused window gate: + `pnpm exec vitest run test/main/presenter/windowPresenter.test.ts --silent --reporter=dot` + passed with 1 file / 4 tests. 
+- User-flow e2e gate: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --workers=1` + passed with 6 tests after the e2e fixture was moved to an isolated temporary `userData` profile + and seeded with completed onboarding state. The earlier failure mode was the local real profile's + encrypted database splash blocking app startup, followed by first-run onboarding intercepting + settings clicks in a blank profile. +- Full local smoke e2e: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/*.smoke.spec.ts --workers=1` + passed with 26 tests and 3 skipped. The skipped tests are the live provider/chat integration + checks (`02-chat-basic`, `03-session-persistence`, and `05-settings-provider`), which require + `RUN_PROVIDER_INTEGRATION=true` plus a configured provider/model/API key outside the default + isolated temporary profile. +- Final local gates after the renderer event cleanup and e2e fixture update: + `pnpm run format`, `pnpm run i18n`, `pnpm run lint`, `pnpm run typecheck`, and + `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/api/preloadBoundaries.test.ts test/main/presenter/windowPresenter.test.ts --silent --reporter=dot` + passed. `src/renderer/src/env.d.ts` now explicitly declares Vite env defaults, CSS imports, + `?url` assets, and inline worker imports so `vue-tsgo` typecheck does not depend on implicit + `vite/client` merge behavior. +- Full Vitest gate: + `pnpm test -- --silent --reporter=dot` passed with 382 files passed, 6 skipped, 3192 tests + passed, and 41 skipped. 
During this final run, stale test expectations were updated so + AgentSession integration asserts typed `sessions.updated` / `chat.stream.completed` publication + instead of retired `session:activated` / `stream:end` channels, and Config helper tests mock both + `sendToMain` and typed renderer publication paths. + +Side effect: + +- TabPresenter still maintains its internal tab state, but no longer sends tab-list/title updates to + the main renderer because there is no subscriber. If a tab shell UI is reintroduced later, define + a shared typed event contract first instead of reusing raw tab channels. +- Floating, splash, and browser-overlay IPC remain intentionally scoped to their preload APIs. A + future convergence pass can move them onto `DEEPCHAT_EVENT_CHANNEL`, but that should be done as a + secondary-renderer contract migration with dedicated preload/e2e coverage rather than as a + presenter-only edit. +- Electron e2e now sets `DEEPCHAT_E2E_USER_DATA_DIR` to a temporary directory by default. This keeps + smoke tests deterministic and avoids reading or modifying the developer's real DeepChat profile, + including encrypted database state and onboarding progress. +- Live chat/provider smoke tests no longer run by default under the temporary profile. Run them with + `RUN_PROVIDER_INTEGRATION=true` and an explicit configured e2e profile/provider when verifying + real external model behavior. + +Final manual gate: + +- Complete all manual checks listed in `plan.md`. diff --git a/docs/architecture/presenter-ipc-migration-plan/verification.md b/docs/architecture/presenter-ipc-migration-plan/verification.md new file mode 100644 index 000000000..99e7aa51f --- /dev/null +++ b/docs/architecture/presenter-ipc-migration-plan/verification.md @@ -0,0 +1,538 @@ +# Presenter IPC Migration Verification Plan + +> Status: active execution checklist. 
Run the relevant slice after each presenter/domain migration, +> then run the full gate before declaring the legacy transport retired. + +## Verification Levels + +| Level | When to run | Required evidence | +| --- | --- | --- | +| Slice contract | Every new route/event/client | Contract schemas reject invalid payloads and accept valid legacy-equivalent payloads | +| Slice unit | Every changed main route/service/presenter adapter | Route handler calls the intended presenter method and returns typed output | +| Slice renderer | Every changed settings/component/store surface | Component/store uses typed client and keeps old UI behavior | +| Static gate | Every migration PR | No new legacy IPC outside allowlists; lint/typecheck pass | +| User-flow gate | After a slice passes static tests | E2E/manual checks for native dialogs, OAuth, ACP, remote channels, DB repair, or long-running tasks | +| Final gate | Before deleting legacy transport | All slice gates plus full `pnpm test` and zero business legacy hits | + +## Standard Commands + +Run after every code migration slice: + +```bash +pnpm run format +pnpm run i18n +pnpm run lint +pnpm run typecheck +``` + +Run targeted tests for the touched slice: + +```bash +pnpm test -- test/main/routes +pnpm test -- test/main/contracts +pnpm test -- test/renderer/api +pnpm test -- test/renderer/components/<ComponentName>.test.ts +pnpm test -- test/renderer/stores/<storeName>.test.ts +``` + +Run final transport-removal evidence: + +```bash +rg "useLegacyPresenter|useLegacyRemoteControlPresenter|useLegacyShortcutPresenter" src/renderer +rg "@api/legacy|legacy/presenters|legacy/runtime" src +rg "presenter:call|remoteControlPresenter:call" src/main src/renderer +rg "DISPATCHABLE_PRESENTERS|REMOTE_CONTROL_METHODS|src/renderer/api/legacy" src/main src/renderer src/preload +node scripts/architecture-guard.mjs +pnpm test +``` + +Run smoke-level Electron user flows after a successful build: + +```bash +pnpm exec playwright test -c test/e2e/playwright.config.ts \ + 
test/e2e/specs/01-launch.smoke.spec.ts \ + test/e2e/specs/04-settings-navigation.smoke.spec.ts \ + --reporter=list \ + --workers=1 +``` + +Use `--workers=1` when combining Electron e2e specs because DeepChat enforces a single running app +instance with `SingletonLock`. Parallel workers can fail during launch even when the route behavior +under test is healthy. + +Current raw IPC allowlist after transport retirement: + +- `src/preload/createBridge.ts` because it is the typed bridge implementation. +- `src/preload/index.ts` for the current synchronous window/webContents id bridge and the narrow + `window.api` runtime helpers still consumed through `src/renderer/api/runtime.ts`. +- `src/preload/plugin-settings-preload.ts` because it wraps `createBridge(ipcRenderer)` behind + the specialized `window.deepchatPlugin` API. +- `src/preload/splash-preload.ts` for startup database unlock before the full route runtime is + guaranteed available; renderer code must use `window.deepchatSplash`. +- `src/preload/floating-preload.ts` for the floating widget specialized API with shared channels, + scoped unsubscribe, and payload validation. +- `src/preload/browser-overlay-preload.ts` for browser overlay activity with shared event schema + validation. + +Any new hit outside these paths should be treated as a migration regression. 
+ +## Presenter Slice Matrix + +| Slice | Automated verification | User-flow / E2E verification | +| --- | --- | --- | +| Guard coverage | Script tests or fixture proving settings legacy usage fails guard; `node scripts/architecture-guard.mjs` with current baseline | None | +| Existing-client replacements | Affected renderer component tests; `test/renderer/api/clients.test.ts` if client changed | File picker, prompt file import, remote default workdir selection | +| `configPresenter` | Config route contract tests, handler tests, ACP/agent/settings component tests | ACP toggle/install/repair/uninstall/manual CRUD; DeepChat agent advanced editing; proxy/update channel/logging folder | +| `llmproviderPresenter` | Provider/model route tests, ACP debug/rate-limit event tests, affected component tests; Provider settings read-only e2e | Refresh models; update rate limit; ACP debug run; GitHub Copilot auth | +| `devicePresenter` | Device/data route tests, affected component tests; Data Settings device read-only e2e | Native select files/directories; destructive data reset in disposable profile | +| `windowPresenter` | Context-aware route tests, settings app/provider deeplink tests; main/settings window-state read-only e2e | Settings navigation, provider install deeplink preview, focus/minimize/maximize/close flows | +| `skillSyncPresenter` | Skill sync route/event tests, import/export wizard tests; SkillSync settings read-only route/event e2e | Import/export with conflict handling | +| `projectPresenter` | Project route tests, environment/remote settings tests; Environments settings read-only e2e | Missing default workdir validation, native path picker, and open directory | +| `knowledgePresenter` | Knowledge route/event tests, knowledge settings tests | Add/delete/re-add file, progress, pause/resume, similarity query | +| `agentSessionPresenter` | Dashboard/RTK route tests, dashboard settings tests | Dashboard display and RTK retry | +| `remoteControlPresenter` | Channel 
route schema/handler tests, remote settings tests | Telegram pair/bind/unbind; Feishu/QQBot/Discord settings; Weixin iLink login | +| `skillPresenter` | `skills.readFile` route and editor tests | Open/edit/save/reopen installed skill | +| `mcpPresenter` | MCP Router route tests with mocked network | Save key, list market, install server | +| `exporter` / NowledgeMem | NowledgeMem route tests and settings tests | Save config, test success/failure, reload settings | +| `sqlitePresenter` | Database repair route tests; Data Settings database-status read-only e2e | Repair copied profile and inspect report | +| `yoBrowserPresenter` | Browser sandbox route tests; Data Settings sandbox surface e2e | Clear sandbox and confirm fresh browser state | +| `oauthPresenter` | OAuth route tests with mocked shell/deeplink | GitHub Copilot login/device flow | +| `shortcutPresenter` | Shortcut store/client tests; existing main shortcut tests | Global shortcuts register once after focus changes | +| Secondary renderers | Preload/API tests for splash/floating/browser overlay/plugin settings | Splash DB unlock; floating drag/open session/theme/language; browser overlay activity | + +## Current Verification Snapshot + +Last updated: 2026-06-13. + +Passed: + +- `pnpm run format` +- `pnpm run i18n` +- `pnpm run lint` +- `pnpm run typecheck` +- `pnpm run build` +- Full `pnpm test -- --silent --reporter=dot`: 376 files passed, 6 skipped; 3175 tests passed, + 41 skipped. The final full run used the project-level Vitest `maxWorkers: 2` setting to avoid + false cold-start timeouts in large renderer component suites. +- Focused migration gate covering preload boundaries, floating presenter, browser overlay, route + contracts, architecture guard, deeplink/error handlers, skill sync, splash, ACP debug, and message + stream store: 13 files / 130 tests passed after the latest splash preload boundary addition. 
+- `pnpm exec vitest run test/renderer/api/preloadBoundaries.test.ts --silent --reporter=dot` + passed with 1 file / 4 tests. The added splash case verifies that `window.deepchatSplash` exposes + only the dedicated splash update/unlock methods, uses scoped `database-security:*` channels, + returns unsubscribe functions, and rejects malformed submit/cancel payloads. +- Electron smoke e2e for launch and settings navigation: 2 tests passed. +- Electron settings IPC boundary e2e: + `test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts` passed with 1 test. It checks the real + settings renderer has `window.deepchat.invoke/on`, does not expose broad + `window.electron` / `api.ipcRenderer`, rejects `presenter:call` as an unknown route, and opens + migrated knowledge, skills, remote, MCP, and data settings surfaces. +- Electron floating IPC boundary e2e: + `test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts` passed with 1 test. It toggles the real + floating window through the typed config route, restores the previous user setting, checks the + floating renderer loads in built/e2e mode, and verifies the scoped `floatingButtonAPI` boundary. +- Electron browser route e2e: + `test/e2e/specs/08-browser-route.smoke.spec.ts` passed with 1 test. It exercises + `browser.loadUrl`, `browser.getStatus`, typed `browser.status.changed`, and `browser.destroy` + against a local `data:` page without clearing real profile sandbox data. +- Focused YoBrowser cleanup e2e: + `test/e2e/specs/08-browser-route.smoke.spec.ts` passed after rebuilding and verifies typed + browser route/event behavior. `test/e2e/specs/01-launch.smoke.spec.ts` and + `test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts` also passed when rerun individually. The + combined 3-spec run hit an app fixture setup timeout in `06-settings-ipc-boundary`, so the + combination is not promoted as stable evidence for this slice. 
+- Electron main renderer IPC boundary e2e: + `test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts` passed with 1 test. It checks the real main + chat renderer has `window.deepchat.invoke/on`, can call the typed `device.getAppVersion`, + `remoteControl.listChannels`, and `remoteControl.getChannelStatus` routes, does not expose broad + `window.electron` / `api.ipcRenderer`, and rejects `presenter:call` as an unknown route. +- Electron Data Settings privacy mode e2e: + `test/e2e/specs/10-settings-privacy-route.smoke.spec.ts` passed with 1 test. It opens the real + Data Settings page, toggles the Privacy Mode switch through the UI, verifies + `settings.getSnapshot` reflects the typed `settings.update` result, and restores the original + `privacyModeEnabled` value before exit. +- Electron Remote Control read-only route e2e: + `test/e2e/specs/11-remote-control-readonly-route.smoke.spec.ts` passed with 1 test. It opens the + real Remote Settings page, verifies the visible channel tabs for Telegram, Feishu, QQBot, Discord, + and Weixin iLink, then reads `remoteControl.listChannels`, `getChannelSettings`, + `getChannelStatus`, and `getChannelBindings` for every channel without requiring live accounts or + mutating remote-control config. +- Focused Remote Control runtime cleanup e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `09-main-ipc-boundary.smoke.spec.ts`, and + `11-remote-control-readonly-route.smoke.spec.ts` passed together with 3 tests using + `--workers=1` after deleting `src/renderer/api/RemoteControlRuntime.ts` and moving the main + `WindowSideBar` to `RemoteControlClient`. +- Focused Upgrade typed-event cleanup: + `pnpm exec vitest run test/main/presenter/upgradePresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/AboutUsSettings.test.ts --silent --reporter=dot` + passed with 4 files / 64 tests. 
The legacy renderer-visible + `update:status-changed`, `update:error`, `update:progress`, and `update:will-restart` raw channels + no longer appear in source or test code; `UPDATE_EVENTS` only keeps the main-internal + `update:state-changed` lifecycle signal. +- Focused Dialog typed-event cleanup: + `pnpm exec vitest run test/main/presenter/dialogPresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/stores/dialogStore.test.ts --silent --reporter=dot` + passed with 5 files / 82 tests. `DialogPresenter.showDialog` no longer sends the retired + `dialog:request` raw event, renderer dialog state opens from typed `dialog.requested`, and dialog + responses still return through `dialog.respond` / `dialog.error` routes. +- Focused Workspace invalidation cleanup: + `pnpm exec vitest run test/main/presenter/workspacePresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts --silent --reporter=dot` + passed with 4 files / 94 tests. Workspace watchers no longer send the retired + `workspace:files-changed` raw event; watcher invalidations are delivered as typed + `workspace.invalidated` events. +- Focused Device reset completion cleanup: + `pnpm exec vitest run test/main/presenter/devicePresenter.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/DataSettings.test.ts --silent --reporter=dot` + passed with 5 files / 103 tests. The development reset completion path now publishes typed + `appRuntime.dataResetCompleteDev` directly, the `WindowPresenter` legacy-channel translation case + was removed, and source scan + `rg "DATA_RESET_COMPLETE_DEV|notification:data-reset-complete-dev" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. 
The destructive reset itself remains excluded from automated e2e and must be + verified in a disposable profile. +- Focused system notification click cleanup: + `pnpm exec vitest run test/main/presenter/notificationPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/App.startup.test.ts --silent --reporter=dot` + passed with 4 files / 67 tests. Electron notification clicks now publish typed + `appRuntime.systemNotificationClicked` directly with the existing `{ payload: id }` payload shape; + the `WindowPresenter` legacy-channel translation case and `NOTIFICATION_EVENTS` constants were + removed. Source scan + `rg "NOTIFICATION_EVENTS|notification:sys-notify-clicked|SYS_NOTIFY_CLICKED" src/main src/renderer -g '*.ts' -g '*.vue'` + returns no hits. Real OS notification display/click remains a platform manual check. +- Focused Ollama pull-progress cleanup: + `pnpm exec vitest run test/main/presenter/llmProviderPresenter/ollamaManager.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/stores/ollamaStore.test.ts --silent --reporter=dot` + passed with 4 files / 58 tests. Pull progress now emits only typed + `providers.ollama.pull.progress`; the old `ollama:pull-model-progress` constants were removed + from main and renderer event files. Source scan + `rg "OLLAMA_EVENTS|ollama:pull-model-progress|PULL_MODEL_PROGRESS" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. Real model pulls remain an opt-in/manual check because they require a live Ollama + daemon and download or reuse local model data. 
+- Focused Skill catalog/session cleanup: + `pnpm exec vitest run test/main/presenter/skillPresenter/skillPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/McpIndicator.test.ts test/renderer/components/SkillsSettings.test.ts test/renderer/components/SkillEditorSheet.test.ts --silent --reporter=dot` + passed with 5 files / 151 tests. `SkillPresenter` no longer sends retired `skill:*` raw events; + discovery, install/uninstall, session activation/deactivation, and watcher metadata changes are + delivered through typed `skills.catalog.changed` and `skills.session.changed`. Source scan + `rg "SKILL_EVENTS|skill:activated|skill:deactivated|skill:discovered|skill:installed|skill:uninstalled|skill:metadata-updated" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. Real skill install/edit/uninstall flows remain manual or dedicated e2e because + they write skill files. +- Focused YoBrowser lifecycle/open cleanup: + `pnpm exec vitest run test/main/presenter/YoBrowserPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/BrowserPanel.test.ts --silent --reporter=dot` + passed with 4 files / 71 tests. `YoBrowserPresenter` no longer sends retired `yo-browser:*` raw + events; lifecycle/open/activity updates are delivered through typed `browser.status.changed`, + `browser.open.requested`, and `browser.activity.changed`. The old window-count event had no + business consumer and was retired. Source scan + `rg "YO_BROWSER_EVENTS|yo-browser:" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. Browser sandbox clearing remains a separate destructive manual check. +- Focused MCP sampling cleanup: + `pnpm exec vitest run test/main/presenter/mcpPresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/stores/mcpSampling.test.ts --silent --reporter=dot` + passed with 4 files / 68 tests. 
`McpPresenter` no longer sends retired `mcp:sampling-*` raw + channels; request, decision, and cancellation state is delivered through typed + `mcp.sampling.request`, `mcp.sampling.decision`, and `mcp.sampling.cancelled` events. Source scan + `rg "mcp:sampling-request|mcp:sampling-decision|mcp:sampling-cancelled|SAMPLING_REQUEST|SAMPLING_DECISION|SAMPLING_CANCELLED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. The focused e2e group + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. A real approve/reject/cancel sampling dialog flow + remains manual or future dedicated e2e because it requires a disposable MCP server that issues a + sampling request and a runnable model path. +- Focused Config font-size cleanup: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/main/routes/settingsHandler.test.ts test/renderer/api/clients.test.ts test/renderer/stores/uiSettingsStore.test.ts --silent --reporter=dot` + passed with 6 files / 88 tests. `fontSizeLevel` updates no longer send the retired + `config:font-size-changed` raw channel; renderer UI state is hydrated and updated through typed + `settings.changed`. Source scan + `rg "config:font-size-changed|FONT_SIZE_CHANGED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. The focused e2e group + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. Real display settings font-size changes and + cross-window class synchronization remain manual or future dedicated e2e because the existing + config smoke is read-only. 
+- Focused NowledgeMem config cleanup: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/components/NowledgeMemSettings.test.ts --silent --reporter=dot` + passed with 5 files / 83 tests. `ConfigPresenter.setNowledgeMemConfig` no longer sends retired + `config:nowledge-mem-config-updated`; renderer settings save/load behavior remains typed route + based through `NowledgeMemClient`. Source scan + `rg "config:nowledge-mem-config-updated|NOWLEDGE_MEM_CONFIG_UPDATED" src/main src/renderer test -g '*.ts' -g '*.vue'` + returns no hits. The focused e2e group + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding and includes temporary config write/restore through + the real settings UI. Live connection testing remains manual because it requires a running + NowledgeMem service. +- Focused MCP config bridge cleanup: + `pnpm exec vitest run test/main/presenter/configPresenter/mcpConfHelper.test.ts test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/stores/mcpStore.test.ts --silent --reporter=dot` + passed with 5 files / 89 tests. `McpConfHelper.batchImportMcpServers` now emits + `MCP_EVENTS.CONFIG_CHANGED` only on the main event bus; renderer updates continue through typed + `mcp.config.changed` published by `legacyTypedEventBridge`. The unused renderer `MCP_EVENTS` + constants were removed. The focused e2e group + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts --workers=1` + passed with 3 smoke tests after rebuilding. 
External batch import remains manual or opt-in e2e + because it mutates MCP server config and may depend on marketplace/network data. +- Focused ACP workspace/debug cleanup: + `pnpm exec vitest run test/main/presenter/acpProvider.test.ts test/main/presenter/llmProviderPresenter/acp/acpProcessManager.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts test/renderer/components/ChatStatusBar.test.ts test/renderer/components/AcpDebugDialog.test.ts --silent --reporter=dot` + passed with 6 files / 157 tests. ACP readiness events now use typed + `sessions.acp.modes.ready`, `sessions.acp.commands.ready`, and + `sessions.acp.configOptions.ready`; `acp-workspace:*` raw constants were retired. ACP debug + events remain a main-internal `ACP_DEBUG_EVENTS.EVENT` bridge input and are renderer-visible only + as typed `providers.acp.debug.event`. Source scan + `rg "ACP_WORKSPACE_EVENTS|acp-workspace:|SESSION_MODES_READY|SESSION_COMMANDS_READY|SESSION_CONFIG_OPTIONS_READY|eventBus\\.sendToRenderer\\(" src/main/presenter/llmProviderPresenter src/main/events.ts src/renderer/src/events.ts test/main/presenter/acpProvider.test.ts test/main/presenter/llmProviderPresenter/acp/acpProcessManager.test.ts test/renderer/components/ChatStatusBar.test.ts -g '*.ts' -g '*.vue'` + returns no hits. The focused e2e group + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/17-acp-readonly-route.smoke.spec.ts test/e2e/specs/18-provider-readonly-route.smoke.spec.ts --workers=1` + passed with 4 smoke tests after rebuilding. Real ACP runtime warmup, debug action execution, + mode/model selection, and config option changes remain manual or opt-in e2e because they require + runnable ACP agents and local dependencies. +- Electron Knowledge read-only route e2e: + `test/e2e/specs/12-knowledge-readonly-route.smoke.spec.ts` passed with 1 test. 
It opens the real + Knowledge Settings page and reads `knowledge.isSupported`, `knowledge.getSupportedLanguages`, + `knowledge.getSeparatorsForLanguage`, and `knowledge.getSupportedFileExtensions` without adding + files, running ingestion, or mutating knowledge-base data. +- Electron MCP read-only route e2e: + `test/e2e/specs/13-mcp-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real MCP + Settings page and reads `mcp.getEnabled`, `mcp.getServers`, `mcp.getClients`, + `mcp.listToolDefinitions`, `mcp.listPrompts`, `mcp.listResources`, and + `mcp.getNpmRegistryStatus` without toggling MCP, refreshing registry metadata, installing + marketplace servers, or starting/stopping MCP servers. +- Electron NowledgeMem config route e2e: + `test/e2e/specs/14-nowledgemem-config-route.smoke.spec.ts` passed with 1 test. It opens the real + Knowledge Settings page, expands the NowledgeMem settings panel, saves a temporary base URL/API + key through UI controls, verifies the typed `nowledgeMem.getConfig/updateConfig` routes, and + restores the original config. +- Electron Dashboard read-only route e2e: + `test/e2e/specs/15-dashboard-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + Settings Overview dashboard and verifies the typed `sessions.getUsageDashboard` summary, + calendar, provider/model breakdown, and RTK snapshot shape without triggering RTK retry. +- Electron Skills read-only route e2e: + `test/e2e/specs/16-skills-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + Skills Settings page, reads `skills.getDirectory` and `skills.listMetadata`, and, when an + installed skill exists, verifies `skills.readFile`, `skills.getFolderTree`, + `skills.getExtension`, and `skills.listScripts` without installing, uninstalling, or saving skill + files. 
+- Focused Skills stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `16-skills-readonly-route.smoke.spec.ts` passed together with 3 tests after main-window detection + was tightened to exclude floating/settings/splash renderer windows. +- Focused Skill catalog/session cleanup e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `16-skills-readonly-route.smoke.spec.ts` passed together with 3 tests after rebuilding. This + verifies the real Skills settings surface after retiring `skill:*` raw events; it does not + install, uninstall, save, or edit skill files. +- Electron ACP read-only route e2e: + `test/e2e/specs/17-acp-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real ACP + Settings page and reads `config.getAcpState`, `config.listAcpRegistryAgents`, + `config.listManualAcpAgents`, `config.getAcpSharedMcpSelections`, and `config.listAgents` for + DeepChat/ACP views without toggling ACP, refreshing registry data, installing/repairing/ + uninstalling registry agents, or mutating manual agents. +- Focused ACP stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `17-acp-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Provider read-only route e2e: + `test/e2e/specs/18-provider-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + Model Providers settings page, waits for provider rows, and reads `providers.listSummaries`, + `providers.listDefaults`, `providers.listModels`, and `providers.getRateLimitStatus` while only + retaining redacted counts/types in the assertion snapshot. It does not save provider settings, + refresh models, test live connectivity, run OAuth, sync ModelScope MCP servers, or start ACP + debug actions. 
+- Focused Provider stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `18-provider-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Focused Ollama pull-progress cleanup e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `18-provider-readonly-route.smoke.spec.ts` passed together with 3 tests after rebuilding. This + verifies the real Provider settings surface after retiring `ollama:pull-model-progress`; it does + not trigger a real Ollama pull. +- Electron SkillSync read-only route/event e2e: + `test/e2e/specs/19-skill-sync-readonly-route.smoke.spec.ts` passed with 1 test after rebuilding + the app. It opens the real Skills settings page, verifies the sync status surface, reads + `skillSync.getRegisteredTools`, `skillSync.getNewDiscoveries`, and + `skillSync.scanExternalTools`, and confirms typed `skillSync.scan.started/completed` events are + delivered. It does not acknowledge discoveries or preview/execute import/export. +- Focused SkillSync stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `19-skill-sync-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Data Security read-only route e2e: + `test/e2e/specs/20-data-security-readonly-route.smoke.spec.ts` passed with 1 test after + rebuilding the app. It opens the real Data Settings page, verifies database encryption, database + repair, and YoBrowser sandbox surfaces are visible, then reads `databaseSecurity.getStatus`, + `device.getInfo`, and `device.getAppVersion` without enabling encryption, changing passwords, + repairing schema, resetting data, or clearing browser sandbox data. +- Focused Data Security stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `20-data-security-readonly-route.smoke.spec.ts` passed together with 3 tests. 
+- Focused Device reset notification cleanup e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `20-data-security-readonly-route.smoke.spec.ts` passed together with 3 tests after rebuilding. + This verifies the real Data Settings surface and read-only device/database routes after retiring + `notification:data-reset-complete-dev`; it deliberately does not click reset-data actions. +- Focused system notification click cleanup e2e: + `test/e2e/specs/01-launch.smoke.spec.ts` and `09-main-ipc-boundary.smoke.spec.ts` passed together + with 2 tests after rebuilding. This proves the real main renderer typed IPC boundary still starts + cleanly after retiring `notification:sys-notify-clicked`; it deliberately does not depend on OS + notification permissions. +- Electron Project read-only route e2e: + `test/e2e/specs/21-project-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + Environments Settings page and reads `project.listRecent`, `project.listEnvironments`, and + `project.pathExists` for both an existing repository path and a generated missing path without + opening directories or invoking the native directory picker. +- Focused Project stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `21-project-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Workspace read-only route e2e: + `test/e2e/specs/29-workspace-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + main renderer, registers the current repository through `workspace.register`, reads + `workspace.readDirectory`, `workspace.searchFiles`, and `workspace.getGitStatus`, then unregisters + the workspace in `finally` without starting watchers, opening files, or revealing paths. 
+- Focused Workspace stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `09-main-ipc-boundary.smoke.spec.ts`, and + `29-workspace-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Window read-only route e2e: + `test/e2e/specs/22-window-readonly-route.smoke.spec.ts` passed with 1 test. It reads + `window.getCurrentState` from both the real main renderer and the real Settings renderer, proving + the context-aware route returns distinct current window state snapshots without minimizing, + maximizing, focusing, or closing either window. +- Focused Window stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `22-window-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Provider install preview e2e: + `test/e2e/specs/25-window-provider-deeplink-preview.smoke.spec.ts` passed with 1 test. It queues + a custom provider install preview through `window.requeuePendingSettingsProviderInstall`, opens + the real Settings window, verifies the provider preview dialog renders the queued provider name, + base URL, and masked key, and confirms the pending preview queue has been consumed without + applying provider configuration. +- Focused Provider preview stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `25-window-provider-deeplink-preview.smoke.spec.ts` passed together with 3 tests. +- Electron Config settings read-only route e2e: + `test/e2e/specs/23-config-readonly-route.smoke.spec.ts` passed with 1 test. It opens the real + DeepChat Agents, Notifications Hooks, and Shortcuts settings pages and reads + `config.listAgents`, `config.resolveDeepChatAgentConfig`, `config.getAgentMcpSelections`, + `config.getHooksNotifications`, and `config.getShortcutKeys` without mutating agents, hooks, or + shortcuts. 
+- Focused Config settings stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `23-config-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Electron Shortcut config route/event e2e: + `test/e2e/specs/28-shortcut-route-restore.smoke.spec.ts` passed with 1 test. It opens the real + Settings Shortcuts page, writes a temporary `QuickSearch` shortcut through + `config.setShortcutKeys` from the Settings renderer, receives + `config.shortcutKeys.changed`, calls `shortcut.destroy`, `shortcut.register`, and + `shortcut.unregister`, then restores the original shortcut config in `finally`. +- Focused Shortcut stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `28-shortcut-route-restore.smoke.spec.ts` passed together with 3 tests using `--workers=1`. +- Focused shortcut event bridge cleanup: + `ConfigPresenter.setShortcutKey` and `ConfigPresenter.resetShortcutKeys` now publish + `config.shortcutKeys.changed` directly, so `legacyTypedEventBridge` no longer monkey patches + config presenter methods. The focused shortcut route/client/component test group passed with + 4 files / 81 tests, and the same 3-spec shortcut e2e group passed after rebuilding. +- Electron Hooks notification command e2e: + `test/e2e/specs/27-hooks-notification-command.smoke.spec.ts` passed with 1 test. It saves a + temporary hook through `config.setHooksNotifications`, verifies the real Notifications Hooks page + renders it, executes a harmless local `node -e` command through `config.testHookCommand`, checks + successful stdout/exit code, and restores the original hooks config in `finally`. +- Focused Hooks notification stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `27-hooks-notification-command.smoke.spec.ts` passed together with 3 tests. 
+- Electron DeepChat agent CRUD e2e: + `test/e2e/specs/26-deepchat-agent-crud.smoke.spec.ts` passed with 1 test after rebuilding the app. + It opens the real DeepChat Agents settings page, creates a uniquely named temporary agent through + the UI, verifies it through `config.listAgents`, updates its name and description through the UI, + deletes it through `config.deleteDeepChatAgent`, and performs best-effort cleanup in `finally`. +- Focused DeepChat agent CRUD stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `26-deepchat-agent-crud.smoke.spec.ts` passed together with 3 tests. +- Electron Config system read-only route e2e: + `test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts` passed with 1 test. It opens the + real About settings page, then reads `config.getProxySettings`, `config.getUpdateChannel`, + `config.getSyncSettings`, `config.getSkillDraftSuggestions`, `config.getEntries` for model + defaults/file-size settings, and `upgrade.getStatus` without opening the General proxy section, + checking for updates, downloading updates, or mutating config. +- Focused Config system stability e2e: + `test/e2e/specs/01-launch.smoke.spec.ts`, `06-settings-ipc-boundary.smoke.spec.ts`, and + `24-config-system-readonly-route.smoke.spec.ts` passed together with 3 tests. +- Focused Upgrade/About stability e2e: + `pnpm exec playwright test test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/24-config-system-readonly-route.smoke.spec.ts --workers=1` + passed with 3 tests after rebuilding with `pnpm exec electron-vite build`. +- Combined stable user-flow e2e for launch, settings navigation, settings IPC boundary, floating IPC + boundary, browser route lifecycle, main renderer IPC boundary, and Data Settings privacy mode + plus Remote Control, Knowledge, MCP, NowledgeMem, and Dashboard routes passed with 12 tests. 
The + e2e launcher waits up to 60 seconds for the main window to avoid false cold-start failures in long + sequential smoke runs. +- Candidate 13-test expansion including the Skills read-only spec is not yet promoted to stable: + the long sequential run hit Electron app setup timeouts in `01-launch` and `08-browser-route`, + while both specs passed when rerun individually. The failure is currently classified as e2e + harness stability rather than presenter-route behavior. +- Source scans show no renderer/main/preload business usage of `@api/legacy/**`, + `presenter:call`, `remoteControlPresenter:call`, `DISPATCHABLE_PRESENTERS`, or + `REMOTE_CONTROL_METHODS`. +- Renderer test harness scan: + `rg "@api/legacy|useLegacyPresenter|legacy/runtime" test/renderer test/main -n` reports only the + intentional architecture guard fixture. Migrated component/store tests now mock typed clients + directly instead of recreating virtual legacy modules. +- Session/conversation/stream cleanup source scans: + `rg "eventBus\\.sendToRenderer\\(|eventBus\\.sendToRendererIfAvailable\\(" src/main src/renderer -g "*.ts" -g "*.vue"` + reports only `src/main/routes/publishDeepchatEvent.ts`, and + `rg "conversation:list-updated|conversation:activated|conversation:deactivated|conversation:message-edited|conversation:scroll-to-message|stream:response|stream:end|stream:error|session:list-updated|session:activated|session:deactivated|session:status-changed|session:pending-inputs-updated|session:compaction-updated" src/main src/renderer -g "*.ts" -g "*.vue"` + is clean. 
+- Focused Session/Runtime typed-event gate: + `pnpm exec vitest run test/main/presenter/configPresenter/fontSizeSettings.test.ts test/main/presenter/agentSessionPresenter/agentSessionPresenter.test.ts test/main/presenter/agentRuntimePresenter/echo.test.ts test/main/presenter/agentRuntimePresenter/pendingInputCoordinator.test.ts test/main/presenter/agentRuntimePresenter/dispatch.test.ts test/main/presenter/agentRuntimePresenter/process.test.ts test/main/presenter/agentRuntimePresenter/agentRuntimePresenter.test.ts test/main/routes/contracts.test.ts test/renderer/api/clients.test.ts --silent --reporter=dot` + passed with 9 files / 339 tests. Coverage includes typed `chat.stream.updated/completed/failed`, + `sessions.status.changed`, `sessions.pendingInputs.changed`, `sessions.compaction.changed`, and + `sessions.updated` publication, plus renderer client subscription coverage. +- Session/Runtime final gate: + `pnpm run format`, `pnpm run i18n`, `pnpm run lint`, `pnpm run typecheck`, and + `pnpm exec electron-vite build` passed. User-angle e2e evidence: + `01-launch`, `09-main-ipc-boundary`, and `23-config-readonly-route` passed in the first focused + run; `06-settings-ipc-boundary` timed out during Electron app fixture setup in that four-spec run, + then passed when rerun alone; `01-launch + 09-main-ipc-boundary` passed together with + `--workers=1`. The timeout is classified with the existing Electron harness cold-start/setup + instability, because the failed spec did not reach assertions and passed independently. +- Final presenter event sweep: + `rg "eventBus\\.send\\(" src/main src/renderer -g "*.ts" -g "*.vue"` and + `rg "legacyTypedEventBridge|setupLegacyTypedEventBridge" src/main test/main -g "*.ts"` are clean. + The last broad dead renderer broadcasts were removed from `WindowPresenter` and `TabPresenter`. + `rg "setActiveTab|update-window-tabs|tab:title-updated|TITLE_UPDATED" src test -g "*.ts" -g "*.vue"` + is clean. 
Remaining + `webContents.send(...)` calls under `src/main/presenter` are limited to explicit secondary-window + protocols: floating button preload channels, splash/database-unlock startup channels, browser + overlay activity, and ACP terminal typed envelopes targeted at settings webContents. +- Final sweep focused tests: + `pnpm exec vitest run test/main/routes/contracts.test.ts test/main/routes/dispatcher.test.ts test/renderer/api/clients.test.ts test/renderer/api/preloadBoundaries.test.ts --silent --reporter=dot` + passed with 4 files / 84 tests, and + `pnpm exec vitest run test/main/presenter/windowPresenter.test.ts --silent --reporter=dot` + passed with 1 file / 4 tests. +- Final sweep e2e: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/01-launch.smoke.spec.ts test/e2e/specs/06-settings-ipc-boundary.smoke.spec.ts test/e2e/specs/07-floating-ipc-boundary.smoke.spec.ts test/e2e/specs/09-main-ipc-boundary.smoke.spec.ts test/e2e/specs/22-window-readonly-route.smoke.spec.ts test/e2e/specs/23-config-readonly-route.smoke.spec.ts --workers=1` + passed with 6 tests. The e2e fixture now launches built Electron against an isolated temporary + `DEEPCHAT_E2E_USER_DATA_DIR` and seeds completed onboarding state, so automated smoke tests do not + depend on the developer's real encrypted database profile or first-run onboarding state. +- Final local full-smoke e2e: + `pnpm exec playwright test -c test/e2e/playwright.config.ts test/e2e/specs/*.smoke.spec.ts --workers=1` + passed with 26 tests and 3 skipped. The skipped specs are live provider/chat integration checks + and require `RUN_PROVIDER_INTEGRATION=true` plus an explicitly configured provider/model/API key. +- Final full Vitest: + `pnpm test -- --silent --reporter=dot` completed with 382 test files passed and 6 skipped, and + 3192 tests passed and 41 skipped. The final fixes updated stale tests to the typed session/chat event + contracts and added complete EventBus mocks for Config helper publishers.
+- Final renderer cleanup evidence: + `rg "WINDOW_EVENTS|SYSTEM_EVENTS" src/renderer/src/events.ts src/renderer test/renderer -g "*.ts" -g "*.vue"` + is clean, and `pnpm run typecheck` passes after explicitly declaring Vite env defaults, CSS + imports, `?url` assets, and inline worker imports in `src/renderer/src/env.d.ts`. + +Not yet passed: + +- External-service/manual flows remain open: GitHub Copilot OAuth, provider live connection/model + refresh/key-status/rate-limit update/ACP debug actions, live chat generation/session persistence + with real provider credentials, Telegram/Weixin/Feishu/QQBot/Discord + remote control, MCP Router marketplace install, NowledgeMem live connection, database encryption + enable/change/disable in a disposable encrypted profile, database repair on a copied real profile, + destructive data reset and browser sandbox reset in a disposable profile, advanced DeepChat agent + editing paths such as model/default-project/tool/subagent controls, hooks notification command + failure/custom-script scenarios, real hook event dispatch, Shortcut Settings UI edit/clear/reset + plus actual OS global shortcut activation/focus/blur/duplicate-registration behavior, + proxy/update-channel saves, logging-folder opening, provider DB refresh, real update + check/download/restart install, Project native path picker/open-directory behavior, Window + focus/minimize/maximize/close flows, OS-level `deepchat://provider/install` dispatch into the + preview queue, and real encrypted-database splash unlock against a disposable encrypted + profile/OS credential state. + +## Evidence Rules + +- A broad claim like "presenter migrated" requires both code search evidence and passing slice tests. +- A route/client replacement is incomplete if the renderer still imports the legacy presenter for the + same behavior. +- A typed event migration is incomplete while any renderer business component listens to the old raw + channel. 
+- Manual checks must name the OS/profile/service used. If a flow cannot be performed, record why and + keep the slice open. diff --git a/docs/guides/code-navigation.md b/docs/guides/code-navigation.md index bf07cc485..e75ba5df9 100644 --- a/docs/guides/code-navigation.md +++ b/docs/guides/code-navigation.md @@ -5,8 +5,8 @@ `phase5` 之后,如果你在 renderer 做新功能,默认心智模型应当是 single-track: 先看 `renderer/api`、shared contracts 和 typed events,再看 main route/runtime; 不要把 `useLegacyPresenter()`、`window.electron`、`window.api` 当作默认开发入口。 -如果你是在审计剩余兼容路径,直接看 `src/renderer/api/legacy/`,不要再从 -`src/renderer/api/legacy/presenters.ts` 找入口,它已经在 `P5` 退役。 +如果你是在审计历史兼容路径,先看 architecture guard、baseline 报告和本仓库历史; +`src/renderer/api/legacy/**` 已经退役并从当前树删除。 ## 先从哪里开始 @@ -35,7 +35,7 @@ | preload bridge builder | `src/preload/createBridge.ts` | 统一 `invoke/on` 协议 | | preload 暴露点 | `src/preload/index.ts` | 把 bridge 暴露到 `window.deepchat` | | renderer clients | `src/renderer/api/` | migrated path 的 renderer 主入口 | -| renderer legacy quarantine | `src/renderer/api/legacy/` | 仅保留 settings compatibility 所需的 legacy transport adapter | +| retired legacy transport | `src/renderer/api/legacy/**` | 已删除;guard 拒绝重新引入 legacy presenter transport | ### Settings diff --git a/docs/guides/getting-started.md b/docs/guides/getting-started.md index 27c916daa..6f38b618a 100644 --- a/docs/guides/getting-started.md +++ b/docs/guides/getting-started.md @@ -48,10 +48,11 @@ Renderer 如果你在旧提交里看到 `AgentPresenter`、`startStreamCompletion`、`agentLoopHandler`, 那已经是退休实现。 -如果你在现有代码里看到 `useLegacyPresenter()`、`window.electron`、`window.api`,请先把它理解为兼容层, +如果你在旧提交或历史文档里看到 `useLegacyPresenter()`、`presenter:call`、 +`remoteControlPresenter:call`、`window.electron`、`window.api`,请先把它理解为已退休兼容背景, 而不是新功能默认入口。当前默认规则写在 `docs/ARCHITECTURE.md`:新 renderer-main 能力走 -`renderer/api/*Client` + `window.deepchat` + shared contracts;临时 legacy transport 只允许放在 -`src/renderer/api/legacy/**`。 +`renderer/api/*Client` + `window.deepchat` + shared contracts;少数 runtime 
能力只能封装在 +明确 allowlist 的 preload/API 边界内。 ## 项目目录速览 diff --git a/resources/acp-registry/registry.json b/resources/acp-registry/registry.json index 20d16222a..7e2855034 100644 --- a/resources/acp-registry/registry.json +++ b/resources/acp-registry/registry.json @@ -122,7 +122,7 @@ { "id": "cline", "name": "Cline", - "version": "3.0.23", + "version": "3.0.24", "description": "Autonomous coding agent CLI - capable of creating/editing files, running commands, using the browser, and more", "repository": "https://github.com/cline/cline", "website": "https://cline.bot/cli", @@ -133,7 +133,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/cline.svg", "distribution": { "npx": { - "package": "cline@3.0.23", + "package": "cline@3.0.24", "args": [ "--acp" ] @@ -143,7 +143,7 @@ { "id": "codebuddy-code", "name": "Codebuddy Code", - "version": "2.105.1", + "version": "2.105.2", "description": "Tencent Cloud's official intelligent coding tool", "website": "https://www.codebuddy.cn/cli/", "authors": [ @@ -152,7 +152,7 @@ "license": "Proprietary", "distribution": { "npx": { - "package": "@tencent-ai/codebuddy-code@2.105.1", + "package": "@tencent-ai/codebuddy-code@2.105.2", "args": [ "--acp" ] @@ -433,7 +433,7 @@ { "id": "dimcode", "name": "DimCode", - "version": "0.1.5", + "version": "0.1.8", "description": "A coding agent that puts leading models at your command.", "website": "https://dimcode.dev/docs/acp.html", "authors": [ @@ -442,7 +442,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "dimcode@0.1.5", + "package": "dimcode@0.1.8", "args": [ "acp" ] @@ -474,7 +474,7 @@ { "id": "factory-droid", "name": "Factory Droid", - "version": "0.144.1", + "version": "0.144.2", "description": "Factory Droid - AI coding agent powered by Factory AI", "website": "https://factory.ai/product/cli", "authors": [ @@ -483,7 +483,7 @@ "license": "proprietary", "distribution": { "npx": { - "package": "droid@0.144.1", + "package": "droid@0.144.2", "args": [ 
"exec", "--output-format", @@ -500,7 +500,7 @@ { "id": "fast-agent", "name": "fast-agent", - "version": "0.7.16", + "version": "0.7.17", "description": "Code and build agents with comprehensive multi-provider support", "repository": "https://github.com/evalstate/fast-agent", "website": "https://fast-agent.ai", @@ -510,7 +510,7 @@ "license": "Apache 2.0", "distribution": { "uvx": { - "package": "fast-agent-acp==0.7.16", + "package": "fast-agent-acp==0.7.17", "args": [ "-x" ] @@ -696,7 +696,7 @@ { "id": "junie", "name": "Junie", - "version": "1831.35.0", + "version": "1892.26.0", "description": "AI Coding Agent by JetBrains", "repository": "https://github.com/JetBrains/junie", "website": "https://junie.jetbrains.com", @@ -707,35 +707,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1831.35/junie-release-1831.35-macos-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1892.26/junie-release-1892.26-macos-aarch64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "darwin-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1831.35/junie-release-1831.35-macos-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1892.26/junie-release-1892.26-macos-amd64.zip", "cmd": "./Applications/junie.app/Contents/MacOS/junie", "args": [ "--acp=true" ] }, "linux-aarch64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1831.35/junie-release-1831.35-linux-aarch64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1892.26/junie-release-1892.26-linux-aarch64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "linux-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1831.35/junie-release-1831.35-linux-amd64.zip", + "archive": 
"https://github.com/JetBrains/junie/releases/download/1892.26/junie-release-1892.26-linux-amd64.zip", "cmd": "./junie-app/bin/junie", "args": [ "--acp=true" ] }, "windows-x86_64": { - "archive": "https://github.com/JetBrains/junie/releases/download/1831.35/junie-release-1831.35-windows-amd64.zip", + "archive": "https://github.com/JetBrains/junie/releases/download/1892.26/junie-release-1892.26-windows-amd64.zip", "cmd": "./junie/junie.exe", "args": [ "--acp=true" @@ -915,7 +915,7 @@ { "id": "nova", "name": "Nova", - "version": "1.1.16", + "version": "1.1.17", "description": "Nova by Compass AI - a fully-fledged software engineer at your command", "repository": "https://github.com/Compass-Agentic-Platform/nova", "website": "https://www.compassap.ai/portfolio/nova.html", @@ -926,7 +926,7 @@ "icon": "https://cdn.agentclientprotocol.com/registry/v1/latest/nova.svg", "distribution": { "npx": { - "package": "@compass-ai/nova@1.1.16", + "package": "@compass-ai/nova@1.1.17", "args": [ "acp" ] @@ -936,7 +936,7 @@ { "id": "opencode", "name": "OpenCode", - "version": "1.17.0", + "version": "1.17.4", "description": "The open source coding agent", "repository": "https://github.com/anomalyco/opencode", "website": "https://opencode.ai", @@ -948,42 +948,42 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-darwin-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-darwin-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-darwin-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-darwin-x64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-linux-arm64.tar.gz", + "archive": 
"https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-linux-arm64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-linux-x64.tar.gz", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-linux-x64.tar.gz", "cmd": "./opencode", "args": [ "acp" ] }, "windows-aarch64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-windows-arm64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-windows-arm64.zip", "cmd": "./opencode", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.0/opencode-windows-x64.zip", + "archive": "https://github.com/anomalyco/opencode/releases/download/v1.17.4/opencode-windows-x64.zip", "cmd": "./opencode.exe", "args": [ "acp" @@ -1157,7 +1157,7 @@ { "id": "stakpak", "name": "Stakpak", - "version": "0.3.86", + "version": "0.3.88", "description": "Open-source DevOps agent in Rust with enterprise-grade security", "repository": "https://github.com/stakpak/agent", "website": "https://stakpak.dev", @@ -1169,35 +1169,35 @@ "distribution": { "binary": { "darwin-aarch64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.86/stakpak-darwin-aarch64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.88/stakpak-darwin-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "darwin-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.86/stakpak-darwin-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.88/stakpak-darwin-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-aarch64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.86/stakpak-linux-aarch64.tar.gz", + "archive": 
"https://github.com/stakpak/agent/releases/download/v0.3.88/stakpak-linux-aarch64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "linux-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.86/stakpak-linux-x86_64.tar.gz", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.88/stakpak-linux-x86_64.tar.gz", "cmd": "./stakpak", "args": [ "acp" ] }, "windows-x86_64": { - "archive": "https://github.com/stakpak/agent/releases/download/v0.3.86/stakpak-windows-x86_64.zip", + "archive": "https://github.com/stakpak/agent/releases/download/v0.3.88/stakpak-windows-x86_64.zip", "cmd": "./stakpak.exe", "args": [ "acp" diff --git a/resources/model-db/providers.json b/resources/model-db/providers.json index 67e02412b..013ef216e 100644 --- a/resources/model-db/providers.json +++ b/resources/model-db/providers.json @@ -1,48 +1,57 @@ { "providers": { - "upstage": { - "id": "upstage", - "name": "Upstage", - "display_name": "Upstage", - "api": "https://api.upstage.ai/v1/solar", - "doc": "https://developers.upstage.ai/docs/apis/chat", + "requesty": { + "id": "requesty", + "name": "Requesty", + "display_name": "Requesty", + "api": "https://router.requesty.ai/v1", + "doc": "https://requesty.ai/solution/llm-routing/models", "models": [ { - "id": "solar-mini", - "name": "solar-mini", - "display_name": "solar-mini", + "id": "xai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-06-12", - "last_updated": "2025-04-22", + "knowledge": "2025-01", + "release_date": 
"2025-09-09", + "last_updated": "2025-09-09", "cost": { - "input": 0.15, - "output": 0.15 + "input": 3, + "output": 15, + "cache_read": 0.75, + "cache_write": 3 }, "type": "chat" }, { - "id": "solar-pro3", - "name": "solar-pro3", - "display_name": "solar-pro3", + "id": "xai/grok-4-fast", + "name": "Grok 4 Fast", + "display_name": "Grok 4 Fast", "modalities": { "input": [ "text" @@ -52,8 +61,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -61,32 +70,38 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2025-01", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.25, - "output": 0.25 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05, + "cache_write": 0.2 }, "type": "chat" }, { - "id": "solar-pro2", - "name": "solar-pro2", - "display_name": "solar-pro2", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94,75 +109,132 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "knowledge": "2025-01", + "release_date": "2025-03-20", + 
"last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 0.25 + "input": 1.25, + "output": 10, + "cache_read": 0.31, + "cache_write": 2.375, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" - } - ] - }, - "clarifai": { - "id": "clarifai", - "name": "Clarifai", - "display_name": "Clarifai", - "api": "https://api.clarifai.com/v2/ext/openai/v1", - "doc": "https://docs.clarifai.com/compute/inference/", - "models": [ + }, { - "id": "clarifai/main/models/mm-poly-8b", - "name": "MM Poly 8B", - "display_name": "MM Poly 8B", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-06", - "last_updated": "2026-02-25", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.658, - "output": 1.11 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.55 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", - "name": "Ministral 3 3B Reasoning 2512", - "display_name": "Ministral 3 3B Reasoning 2512", + 
"id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -170,32 +242,55 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-12", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1.039, - "output": 0.54825 + "input": 2, + "output": 12, + "cache_read": 0.2, + "cache_write": 4.5 }, "type": "chat" }, { - "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", - "name": "Ministral 3 14B Reasoning 2512", - "display_name": "Ministral 3 14B Reasoning 2512", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -203,98 +298,149 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - 
"release_date": "2025-12-01", - "last_updated": "2025-12-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2.5, - "output": 1.7 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 1 }, "type": "chat" }, { - "id": "arcee_ai/AFM/models/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.045, - "output": 0.15 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", 
+ "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 0.5 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "audio", + "image", + "video" ], "output": [ - "text" + "text", + "audio", + "image" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -303,60 +449,74 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.36, - "output": 1.3 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat (latest)", 
+ "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.11458, - "output": 0.74812 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/chat-completion/models/Kimi-K2_6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -367,10 +527,10 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -379,29 +539,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.95, - "output": 4 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", - "name": "DeepSeek OCR", - 
"display_name": "DeepSeek OCR", + "id": "openai/o4-mini", + "name": "o4 Mini", + "display_name": "o4 Mini", "modalities": { "input": [ "text", @@ -412,39 +576,57 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-02-25", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.2, - "output": 0.7 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", - "name": "MiniMax-M2.5 High Throughput", - "display_name": "MiniMax-M2.5 High Throughput", + "id": "openai/gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -452,193 +634,318 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": 
"openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-12-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.045, - "output": 0.18 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", - "name": "GPT OSS 120B High Throughput", - "display_name": "GPT OSS 120B High Throughput", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "display_name": "GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2026-02-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + 
"low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.09, - "output": 0.36 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" - } - ] - }, - "the-grid-ai": { - "id": "the-grid-ai", - "name": "The Grid AI", - "display_name": "The Grid AI", - "api": "https://api.thegrid.ai/v1", - "doc": "https://thegrid.ai/docs", - "models": [ + }, { - "id": "text-prime", - "name": "Text Prime", - "display_name": "Text Prime", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 30000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-05-19", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, "type": "chat" }, { - "id": "agent-standard", - "name": "Agent Standard", - "display_name": "Agent Standard", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 400000, + 
"output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, "type": "chat" }, { - "id": "text-standard", - "name": "Text Standard", - "display_name": "Text Standard", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 400000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-05-19", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "agent-prime", - "name": "Agent Prime", - "display_name": "Agent Prime", + "id": 
"openai/gpt-5-image", + "name": "GPT-5 Image", + "display_name": "GPT-5 Image", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -646,44 +953,96 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2024-10-01", + "release_date": "2025-10-14", + "last_updated": "2025-10-14", + "cost": { + "input": 5, + "output": 10, + "cache_read": 1.25 + }, "type": "chat" }, { - "id": "code-prime", - "name": "Code Prime", - "display_name": "Code Prime", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + 
"cache_read": 0.5 + } + }, "type": "chat" }, { - "id": "agent-max", - "name": "Agent Max", - "display_name": "Agent Max", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", @@ -694,39 +1053,34 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, "type": "chat" }, { - "id": "code-standard", - "name": "Code Standard", - "display_name": "Code Standard", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -734,24 +1088,51 @@ }, "limit": { "context": 128000, - "output": 16000 + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + 
"input": 0.25, + "output": 2, + "cache_read": 0.03 + }, "type": "chat" }, { - "id": "code-max", - "name": "Code Max", - "display_name": "Code Max", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ "text", @@ -762,50 +1143,43 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-04", - "last_updated": "2026-05-19", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "text-max", - "name": "Text Max", - "display_name": "Text Max", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 16000, + "output": 4000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -814,46 +1188,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-24", - 
"last_updated": "2026-05-19", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 + }, "type": "chat" - } - ] - }, - "fireworks-ai": { - "id": "fireworks-ai", - "name": "Fireworks AI", - "display_name": "Fireworks AI", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://fireworks.ai/docs/", - "models": [ + }, { - "id": "accounts/fireworks/models/minimax-m2p5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -862,29 +1245,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "accounts/fireworks/models/qwen3p6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ "text", @@ -895,41 
+1288,42 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-04", - "last_updated": "2026-04-04", + "knowledge": "2024-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -939,35 +1333,53 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-01", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "accounts/fireworks/models/minimax-m2p7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -978,493 +1390,692 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-12", - "last_updated": "2026-04-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "accounts/fireworks/models/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + 
"release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.07, - "output": 0.3, - "cache_read": 0.035 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "anthropic/claude-3-7-sonnet", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "accounts/fireworks/models/kimi-k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": 
true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "accounts/fireworks/models/glm-5p1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "accounts/fireworks/models/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "accounts/fireworks/routers/kimi-k2p6-fast", - "name": "Kimi K2.6 Fast", - "display_name": "Kimi K2.6 Fast", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 62000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-06-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-01", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.3 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "accounts/fireworks/routers/kimi-k2p6-turbo", - "name": "Kimi K2.6 Turbo", - "display_name": "Kimi K2.6 Turbo", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.3 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "accounts/fireworks/routers/glm-5p1-fast", - "name": "GLM 5.1 Fast", - "display_name": "GLM 5.1 Fast", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 2.8, - "output": 8.8, - "cache_read": 0.52 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" - } - ] - }, - "ambient": { - "id": "ambient", - "name": "Ambient", - "display_name": "Ambient", - "api": "https://api.ambient.xyz/v1", - "doc": "https://ambient.xyz", - "models": [ + }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0, - "cache_write": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" - }, + } + ] + }, + "qiniu-ai": { + "id": "qiniu-ai", + "name": "Qiniu", + "display_name": "Qiniu", + "api": "https://api.qnaigc.com/v1", + "doc": "https://developer.qiniu.com/aitokenapi", + "models": [ { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -1483,32 +2094,16 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.2, - "cache_write": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" - } - ] - }, - "stackit": { - "id": "stackit", - "name": "STACKIT", - "display_name": "STACKIT", - "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", - "doc": "https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", - "models": [ + }, { - "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "doubao-1.5-thinking-pro", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ "text" @@ -1519,30 
+2114,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.16, - "output": 0.27 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3-Vl 30b A3b Thinking", + "display_name": "Qwen3-Vl 30b A3b Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -1550,58 +2144,62 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", - "cost": { - "input": 0.49, - "output": 0.71 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-09", + "last_updated": "2026-02-09", "type": "chat" }, { - "id": "intfloat/e5-mistral-7b-instruct", - "name": "E5 Mistral 7B", - "display_name": "E5 Mistral 7B", + "id": "claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 200000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - 
"open_weights": true, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", - "cost": { - "input": 0.02, - "output": 0.02 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "type": "chat" }, { - "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ "text" @@ -1612,7 +2210,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16000 }, "temperature": true, "tool_call": true, @@ -1620,115 +2218,96 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-05", - "last_updated": "2024-12-05", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", - "name": "Qwen3-VL 235B", - "display_name": "Qwen3-VL 235B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235b A22B Instruct 2507", + "display_name": "Qwen3 235b A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 218000, - "output": 8192 + "context": 262144, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 1.64, - "output": 1.91 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "Qwen/Qwen3-VL-Embedding-8B", - "name": "Qwen3-VL Embedding 8B", - "display_name": "Qwen3-VL Embedding 8B", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + 
"text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", - "cost": { - "input": 0.09, - "output": 0.09 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 37000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-05-17", - "last_updated": "2025-05-17", - "cost": { - "input": 0.49, - "output": 0.71 - }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -1738,8 +2317,8 @@ ] }, "limit": { - "context": 131000, - "output": 8192 + "context": 40000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -1749,64 +2328,92 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, + "open_weights": false, "release_date": "2025-08-05", "last_updated": "2025-08-05", - "cost": { - "input": 0.49, - 
"output": 0.71 - }, "type": "chat" - } - ] - }, - "ovhcloud": { - "id": "ovhcloud", - "name": "OVHcloud AI Endpoints", - "display_name": "OVHcloud AI Endpoints", - "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", - "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", - "models": [ + }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", - "cost": { - "input": 1.01, - "output": 1.01 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-06", + "last_updated": "2025-09-06", "type": "chat" }, { - "id": "qwen3guard-gen-8b", - "name": "Qwen3Guard-Gen-8B", - "display_name": "Qwen3Guard-Gen-8B", + "id": "claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 8200 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-09", + "last_updated": "2025-09-09", + "type": "chat" + }, + { + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 
Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -1816,35 +2423,38 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -1855,90 +2465,90 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", - "cost": { - "input": 0.09, - "output": 0.25 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen3-Coder-30B-A3B-Instruct", + "id": "claude-4.5-haiku", + "name": "Claude 4.5 Haiku", + "display_name": "Claude 4.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", - "cost": { - "input": 0.07, - "output": 0.26 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "type": "chat" }, { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "kling-v2-6", + "name": "Kling-V2 6", + "display_name": "Kling-V2 6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 99999999, + "output": 99999999 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0.11, - "output": 0.11 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-13", + "last_updated": "2026-01-13", "type": "chat" }, { - "id": "meta-llama-3_3-70b-instruct", - "name": "Meta-Llama-3_3-70B-Instruct", - "display_name": "Meta-Llama-3_3-70B-Instruct", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -1949,27 +2559,24 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0.74, - "output": 0.74 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral-Small-3.2-24B-Instruct-2506", - "display_name": 
"Mistral-Small-3.2-24B-Instruct-2506", + "id": "claude-4.1-opus", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ "text", @@ -1980,40 +2587,39 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-16", - "last_updated": "2025-07-16", - "cost": { - "input": 0.1, - "output": 0.31 - }, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "qwen3.6-27b", - "name": "Qwen3.6-27B", - "display_name": "Qwen3.6-27B", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -2024,28 +2630,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", - "cost": { - "input": 0.47, - "output": 3.19 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -2055,81 +2666,78 @@ ] }, "limit": { - "context": 131072, - "output": 
131072 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", - "cost": { - "input": 0.09, - "output": 0.47 - }, + "open_weights": false, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "doubao-seed-2.0-pro", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", - "cost": { - "input": 0.05, - "output": 0.18 - }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "doubao-seed-1.6", + "name": "Doubao-Seed 1.6", + "display_name": "Doubao-Seed 1.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -2137,43 +2745,29 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", - "cost": { - "input": 0.12, - "output": 0.18 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "doubao-seed-1.6-thinking", + "name": "Doubao-Seed 1.6 Thinking", + "display_name": "Doubao-Seed 1.6 Thinking", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -2181,62 +2775,46 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-05-18", - "last_updated": "2026-05-18", - "cost": { - "input": 0.71, - "output": 4.25 - }, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", - "cost": { - "input": 0.11, - "output": 0.11 - }, + 
"attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral-Nemo-Instruct-2407", - "display_name": "Mistral-Nemo-Instruct-2407", + "id": "qwen-max-2025-01-25", + "name": "Qwen2.5-Max-2025-01-25", + "display_name": "Qwen2.5-Max-2025-01-25", "modalities": { "input": [ "text" @@ -2246,8 +2824,8 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -2255,55 +2833,44 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", - "cost": { - "input": 0.14, - "output": 0.14 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3guard-gen-0.6b", - "name": "Qwen3Guard-Gen-0.6B", - "display_name": "Qwen3Guard-Gen-0.6B", + "id": "claude-4.0-sonnet", + "name": "Claude 4.0 Sonnet", + "display_name": "Claude 4.0 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" - } - ] - }, - "iflowcn": { - "id": "iflowcn", - "name": "iFlow", - "display_name": "iFlow", - "api": "https://apis.iflow.cn/v1", - "doc": "https://platform.iflow.cn/en/docs", - "models": [ + }, { - "id": "qwen3-max-preview", - "name": "Qwen3-Max-Preview", - "display_name": "Qwen3-Max-Preview", + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", + 
"display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ "text" @@ -2313,40 +2880,24 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 128000, + "output": 12000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30b A3b Instruct 2507", + "display_name": "Qwen3 30b A3b Instruct 2507", "modalities": { "input": [ "text" @@ -2356,35 +2907,24 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-11-13", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -2394,13 +2934,14 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": 
true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -2414,20 +2955,15 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-09-12", + "last_updated": "2025-09-12", "type": "chat" }, { - "id": "qwen3-235b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -2437,8 +2973,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -2446,21 +2982,27 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2-Exp", - "display_name": "DeepSeek-V3.2-Exp", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -2471,245 +3013,255 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": 
false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct", - "name": "Qwen3-235B-A22B-Instruct", - "display_name": "Qwen3-235B-A22B-Instruct", + "id": "doubao-1.5-vision-pro", + "name": "Doubao 1.5 Vision Pro", + "display_name": "Doubao 1.5 Vision Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 16000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3-Max", - "display_name": "Qwen3-Max", + "id": "gemini-3.0-pro-image-preview", + "name": "Gemini 3.0 Pro Image Preview", + "display_name": "Gemini 3.0 Pro Image Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3-Coder-Plus", - "display_name": "Qwen3-Coder-Plus", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", + "type": "imageGeneration" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - 
"release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3-235B-A22B-Thinking", - "display_name": "Qwen3-235B-A22B-Thinking", + "id": "claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL-Plus", - "display_name": "Qwen3-VL-Plus", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30b A3b Thinking 2507", + "display_name": "Qwen3 30b A3b Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 126000, "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ 
-2722,53 +3274,46 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi-K2-0905", - "display_name": "Kimi-K2-0905", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen 2.5 VL 72B Instruct", + "display_name": "Qwen 2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -2779,69 +3324,59 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi-K2", - "display_name": "Kimi-K2", + "id": "doubao-seed-1.6-flash", + "name": "Doubao-Seed 1.6 
Flash", + "display_name": "Doubao-Seed 1.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-08-15", + "last_updated": "2025-08-15", "type": "chat" - } - ] - }, - "302ai": { - "id": "302ai", - "name": "302.AI", - "display_name": "302.AI", - "api": "https://api.302.ai/v1", - "doc": "https://doc.302.ai", - "models": [ + }, { - "id": "kimi-k2-thinking-turbo", - "name": "kimi-k2-thinking-turbo", - "display_name": "kimi-k2-thinking-turbo", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -2851,8 +3386,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -2862,23 +3397,17 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 1.265, - "output": 9.119 - }, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "type": "chat" }, { - "id": "chatgpt-4o-latest", - "name": "chatgpt-4o-latest", - "display_name": "chatgpt-4o-latest", + "id": "qwen3-235b-a22b", + "name": "Qwen 3 235B A22B", + "display_name": "Qwen 3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -2886,61 +3415,61 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - 
"attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-08", - "last_updated": "2024-08-08", - "cost": { - "input": 5, - "output": 15 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "grok-4.1", - "name": "grok-4.1", - "display_name": "grok-4.1", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 2, - "output": 10 - }, + "release_date": "2025-08-14", + "last_updated": "2025-08-14", "type": "chat" }, { - "id": "doubao-seed-1-6-vision-250815", - "name": "doubao-seed-1-6-vision-250815", - "display_name": "doubao-seed-1-6-vision-250815", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", @@ -2952,201 +3481,157 @@ }, "limit": { "context": 256000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-30", - 
"last_updated": "2025-09-30", - "cost": { - "input": 0.114, - "output": 1.143 - }, + "release_date": "2026-02-22", + "last_updated": "2026-02-22", "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "claude-opus-4-5", - "display_name": "claude-opus-4-5", + "id": "mimo-v2-flash", + "name": "Mimo-V2-Flash", + "display_name": "Mimo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "gpt-5-pro", - "display_name": "gpt-5-pro", + "id": "qwen-vl-max-2025-01-25", + "name": "Qwen VL-MAX-2025-01-25", + "display_name": "Qwen VL-MAX-2025-01-25", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", - "cost": { - "input": 15, - "output": 120 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "claude-sonnet-4-6", - "display_name": "claude-sonnet-4-6", + "id": "qwen2.5-vl-7b-instruct", + "name": "Qwen 2.5 VL 7B Instruct", + "display_name": "Qwen 2.5 VL 7B Instruct", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", - "cost": { - "input": 3, - "output": 15 + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "type": "chat" + }, + { + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "claude-4.5-opus", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ "text", @@ -3157,10 +3642,42 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 200000 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "type": "chat" + }, + { + "id": "gemini-3.0-pro-preview", + "name": "Gemini 3.0 
Pro Preview", + "display_name": "Gemini 3.0 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "pdf", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -3170,74 +3687,63 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", - "cost": { - "input": 0.25, - "output": 2 - }, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "gemini-2.5-flash-image", - "display_name": "gemini-2.5-flash-image", + "id": "doubao-seed-2.0-mini", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-08", - "last_updated": "2025-10-08", - "cost": { - "input": 0.3, - "output": 30 - }, - "type": "imageGeneration" + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "glm-4.7-flashx", - "display_name": "glm-4.7-flashx", + "id": "claude-4.0-opus", + 
"name": "Claude 4.0 Opus", + "display_name": "Claude 4.0 Opus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -3245,7 +3751,7 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -3253,26 +3759,19 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-20", - "last_updated": "2026-01-20", - "cost": { - "input": 0.0715, - "output": 0.429 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "gpt-4o", - "name": "gpt-4o", - "display_name": "gpt-4o", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -3280,117 +3779,108 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 2.5, - "output": 10 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "gpt-5.2", - "name": "gpt-5.2", - "display_name": "gpt-5.2", + "id": "gemini-3.0-flash-preview", + "name": "Gemini 3.0 Flash Preview", + "display_name": "Gemini 3.0 Flash Preview", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", - "cost": { - "input": 1.75, - "output": 14 - }, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "ministral-14b-2512", - "name": "ministral-14b-2512", - "display_name": "ministral-14b-2512", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 80000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "cost": { - "input": 0.33, - "output": 0.33 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "qwen-turbo", + "name": "Qwen-Turbo", + "display_name": "Qwen-Turbo", "modalities": { "input": [ "text" @@ -3400,8 +3890,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -3411,24 +3901,25 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.286, - "output": 1.142 - }, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -3438,8 +3929,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 40000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -3460,24 +3951,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.575, - "output": 2.3 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "claude-haiku-4-5-20251001", - "display_name": "claude-haiku-4-5-20251001", + "id": "claude-4.5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -3491,162 +3976,109 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for 
this model family." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", - "cost": { - "input": 1, - "output": 5 - }, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax-M1", - "display_name": "MiniMax-M1", + "id": "doubao-seed-2.0-lite", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", - "cost": { - "input": 0.132, - "output": 1.254 - }, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-08", - 
"last_updated": "2025-08-08", - "cost": { - "input": 1.25, - "output": 10 - }, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "qwen3-max-2025-09-23", - "display_name": "qwen3-max-2025-09-23", + "id": "doubao-seed-2.0-code", + "name": "Doubao Seed 2.0 Code", + "display_name": "Doubao Seed 2.0 Code", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", - "cost": { - "input": 0.86, - "output": 3.43 - }, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen-Flash", - "display_name": "Qwen-Flash", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -3656,8 +4088,8 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 256000, + "output": 100000 }, "temperature": true, "tool_call": true, @@ -3677,74 +4109,81 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.022, - "output": 0.22 - }, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "claude-haiku-4-5", - "display_name": "claude-haiku-4-5", + "id": "moonshotai/kimi-k2.5", + "name": "Moonshotai/Kimi-K2.5", + "display_name": "Moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + 
"output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-16", - "last_updated": "2025-10-16", - "cost": { - "input": 1, - "output": 5 + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "type": "chat" + }, + { + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 100000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "grok-4-fast-non-reasoning", - "display_name": "grok-4-fast-non-reasoning", + "id": "stepfun-ai/gelab-zero-4b-preview", + "name": "Stepfun-Ai/Gelab Zero 4b Preview", + "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", "modalities": { "input": [ "text", @@ -3755,8 +4194,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 8192, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -3765,19 +4204,14 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", - "cost": { - "input": 0.2, - "output": 0.5 - }, + 
"release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "x-ai/grok-code-fast-1", + "name": "x-AI/Grok-Code-Fast 1", + "display_name": "x-AI/Grok-Code-Fast 1", "modalities": { "input": [ "text" @@ -3787,43 +4221,67 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", - "cost": { - "input": 0.3, - "output": 1.2 + "release_date": "2025-09-02", + "last_updated": "2025-09-02", + "type": "chat" + }, + { + "id": "x-ai/grok-4.1-fast-reasoning", + "name": "X-Ai/Grok 4.1 Fast Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Reasoning", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 20000000, + "output": 2000000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "gemini-2.0-flash-lite", - "display_name": "gemini-2.0-flash-lite", + "id": "x-ai/grok-4.1-fast-non-reasoning", + "name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" @@ -3831,42 +4289,40 @@ }, "limit": { "context": 2000000, - "output": 8192 + "output": 2000000 }, "temperature": 
true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-06-16", - "last_updated": "2025-06-16", - "cost": { - "input": 0.075, - "output": 0.3 - }, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "gpt-5.4-pro", - "display_name": "gpt-5.4-pro", + "id": "x-ai/grok-4-fast-reasoning", + "name": "X-Ai/Grok-4-Fast-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 2000000, + "output": 2000000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -3874,195 +4330,140 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 30, - "output": 180, - "cache_read": 0, - "cache_write": 0, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } - }, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen-Max-Latest", - "display_name": "Qwen-Max-Latest", + "id": "x-ai/grok-4-fast", + "name": "x-AI/Grok-4-Fast", + "display_name": "x-AI/Grok-4-Fast", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" 
], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", - "cost": { - "input": 0.343, - "output": 1.372 - }, + "release_date": "2025-09-20", + "last_updated": "2025-09-20", "type": "chat" }, { - "id": "doubao-seed-1-8-251215", - "name": "doubao-seed-1-8-251215", - "display_name": "doubao-seed-1-8-251215", + "id": "x-ai/grok-4-fast-non-reasoning", + "name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 224000, - "output": 64000 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, "release_date": "2025-12-18", "last_updated": "2025-12-18", - "cost": { - "input": 0.114, - "output": 0.286 - }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "x-ai/grok-4.1-fast", + "name": "x-AI/Grok-4.1-Fast", + "display_name": "x-AI/Grok-4.1-Fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6 - }, + "release_date": 
"2025-11-20", + "last_updated": "2025-11-20", "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", + "id": "z-ai/autoglm-phone-9b", + "name": "Z-Ai/Autoglm Phone 9b", + "display_name": "Z-Ai/Autoglm Phone 9b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 12800, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.29, - "output": 0.43 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "claude-opus-4-20250514", - "display_name": "claude-opus-4-20250514", + "id": "z-ai/glm-4.7", + "name": "Z-Ai/GLM 4.7", + "display_name": "Z-Ai/GLM 4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -4070,135 +4471,78 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 15, - "output": 75 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "gpt-5.4", - "name": "gpt-5.4", - "display_name": "gpt-5.4", + "id": "z-ai/glm-4.6", + "name": "Z-AI/GLM 4.6", + "display_name": "Z-AI/GLM 4.6", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 200000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "cache_write": 0, - "tiers": [ - { - "input": 5, - "output": 22.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5 - } - }, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "gemini-3-flash-preview", - "display_name": "gemini-3-flash-preview", + "id": "z-ai/glm-5", + "name": "Z-Ai/GLM 5", + "display_name": "Z-Ai/GLM 5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 128000 
}, "temperature": true, "tool_call": true, @@ -4209,37 +4553,24 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-12-18", - "last_updated": "2025-12-18", - "cost": { - "input": 0.5, - "output": 3 - }, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "Deepseek-Reasoner", - "display_name": "Deepseek-Reasoner", + "id": "openai/gpt-5", + "name": "OpenAI/GPT-5", + "display_name": "OpenAI/GPT-5", "modalities": { "input": [ "text" @@ -4249,7 +4580,7 @@ ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, "temperature": true, @@ -4261,84 +4592,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.29, - "output": 0.43 - }, + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "type": "chat" }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3-235B-A22B", - "display_name": "Qwen3-235B-A22B", + "id": "openai/gpt-5.2", + "name": "OpenAI/GPT-5.2", + "display_name": "OpenAI/GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ 
"text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", - "cost": { - "input": 0.29, - "output": 2.86 - }, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi/Mimo-V2-Flash", + "display_name": "Xiaomi/Mimo-V2-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -4346,25 +4689,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "mistral-large-2512", - "display_name": 
"mistral-large-2512", + "id": "stepfun/step-3.5-flash", + "name": "Stepfun/Step-3.5 Flash", + "display_name": "Stepfun/Step-3.5 Flash", "modalities": { "input": [ "text", @@ -4375,29 +4715,24 @@ ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 64000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "cost": { - "input": 1.1, - "output": 3.3 - }, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "meituan/longcat-flash-lite", + "name": "Meituan/Longcat-Flash-Lite", + "display_name": "Meituan/Longcat-Flash-Lite", "modalities": { "input": [ "text" @@ -4407,108 +4742,109 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 320000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.286, - "output": 1.142 + "open_weights": false, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "type": "chat" + }, + { + "id": "meituan/longcat-flash-chat", + "name": "Meituan/Longcat-Flash-Chat", + "display_name": "Meituan/Longcat-Flash-Chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, + "attachment": false, + 
"open_weights": false, + "release_date": "2025-11-05", + "last_updated": "2025-11-05", "type": "chat" }, { - "id": "claude-sonnet-4-6-thinking", - "name": "claude-sonnet-4-6-thinking", - "display_name": "claude-sonnet-4-6-thinking", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek/DeepSeek-V3.1-Terminus", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "type": "chat" + }, + { + "id": "deepseek/deepseek-v3.1-terminus-thinking", + "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32000 + }, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-18", - "last_updated": "2026-03-13", - "cost": { - "input": 3, - "output": 15 - }, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "gpt-5.2-chat-latest", - "display_name": "gpt-5.2-chat-latest", + "id": "deepseek/deepseek-v3.2-exp-thinking", + "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "display_name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -4516,96 +4852,62 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-12", - "last_updated": "2025-12-12", - "cost": { - "input": 1.75, - "output": 14 - }, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "gpt-5.1", - "name": "gpt-5.1", - "display_name": "gpt-5.1", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek/DeepSeek-V3.2-Exp", + "display_name": "DeepSeek/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": 
false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 1.25, - "output": 10 - }, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "grok-4-fast-reasoning", - "display_name": "grok-4-fast-reasoning", + "id": "deepseek/deepseek-v3.2-251201", + "name": "Deepseek/DeepSeek-V3.2", + "display_name": "Deepseek/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -4613,71 +4915,55 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", - "cost": { - "input": 0.2, - "output": 0.5 - }, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "grok-4-1-fast-non-reasoning", - "display_name": "grok-4-1-fast-non-reasoning", + "id": "deepseek/deepseek-math-v2", + "name": "Deepseek/Deepseek-Math-V2", + "display_name": "Deepseek/Deepseek-Math-V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 160000, + "output": 160000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", - "cost": { - "input": 0.2, - "output": 0.5 - }, + "release_date": "2025-12-04", + 
"last_updated": "2025-12-04", "type": "chat" }, { - "id": "claude-opus-4-1-20250805-thinking", - "name": "claude-opus-4-1-20250805-thinking", - "display_name": "claude-opus-4-1-20250805-thinking", + "id": "minimax/minimax-m2.5", + "name": "Minimax/Minimax-M2.5", + "display_name": "Minimax/Minimax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -4687,52 +4973,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-27", - "last_updated": "2025-05-27", - "cost": { - "input": 15, - "output": 75 - }, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "minimax/minimax-m2.1", + "name": "Minimax/Minimax-M2.1", + "display_name": "Minimax/Minimax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -4742,43 +5006,22 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 1.25, - "output": 10 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "claude-3-5-haiku-latest", - "display_name": "claude-3-5-haiku-latest", + "id": "minimax/minimax-m2", + "name": "Minimax/Minimax-M2", + "display_name": "Minimax/Minimax-M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -4786,41 +5029,40 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": 
"2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 0.8, - "output": 4 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "minimax/minimax-m2.5-highspeed", + "name": "Minimax/Minimax-M2.5 Highspeed", + "display_name": "Minimax/Minimax-M2.5 Highspeed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -4828,21 +5070,62 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "type": "chat" + } + ] + }, + "alibaba-cn": { + "id": "alibaba-cn", + "name": "alibaba-cn", + "display_name": "alibaba-cn", + "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ + { + "id": "qwen2-5-math-72b-instruct", + "name": "Qwen2.5-Math 72B Instruct", + "display_name": "Qwen2.5-Math 72B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 3072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.29, - "output": 0.86 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3-30B-A3B", - 
"display_name": "Qwen3-30B-A3B", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -4852,13 +5135,14 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -4873,53 +5157,68 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.11, - "output": 1.08 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 2, - "output": 8 + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "deepseek-v3.2-thinking", - "name": "DeepSeek-V3.2-Thinking", - "display_name": "DeepSeek-V3.2-Thinking", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + 
"display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -4929,8 +5228,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -4938,167 +5237,153 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "claude-sonnet-4-5-20250929", - "display_name": "claude-sonnet-4-5-20250929", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 3, - "output": 15 + "input": 0.115, + "output": 0.287, + "reasoning": 1.147 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "claude-3-5-haiku-20241022", - "display_name": "claude-3-5-haiku-20241022", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.8, - "output": 4 + "input": 0.216, + "output": 0.861 }, "type": "chat" }, { - "id": "gpt-5.4-mini-2026-03-17", - "name": "gpt-5.4-mini-2026-03-17", - "display_name": "gpt-5.4-mini-2026-03-17", + "id": "qwen2-5-coder-7b-instruct", + "name": "Qwen2.5-Coder 7B Instruct", + "display_name": "Qwen2.5-Coder 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "Deepseek-Chat", - "display_name": "Deepseek-Chat", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -5108,7 +5393,7 @@ ] }, "limit": { - "context": 128000, + "context": 65536, "output": 8192 }, "temperature": true, @@ -5118,87 +5403,66 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.29, - "output": 0.43 + "input": 0.287, + "output": 1.147 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "gpt-5.4-nano", - "display_name": "gpt-5.4-nano", + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - 
"none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.2, - "output": 1.25 + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101-thinking", - "name": "claude-opus-4-5-20251101-thinking", - "display_name": "claude-opus-4-5-20251101-thinking", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -5208,113 +5472,87 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "claude-opus-4-1-20250805", - "display_name": "claude-opus-4-1-20250805", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 15, - "output": 75 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "qwen3-coder-480b-a35b-instruct", - "display_name": "qwen3-coder-480b-a35b-instruct", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -5323,108 +5561,85 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.86, - "output": 3.43 + "input": 0.23, + "output": 0.918, + "input_audio": 3.584, + "output_audio": 7.168 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "qwen2-5-math-7b-instruct", + "name": "Qwen2.5-Math 7B Instruct", + "display_name": "Qwen2.5-Math 7B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2024-04", + "release_date": 
"2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.145, - "output": 0.43 + "input": 0.144, + "output": 0.287 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.144, + "output": 0.574 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "gemini-2.5-flash-preview-09-2025", - "display_name": "gemini-2.5-flash-preview-09-2025", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ "text", @@ -5436,7 +5651,7 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -5446,54 +5661,49 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 128000 + } + } + ] }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -5503,33 +5713,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.72, - "output": 3.2 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "gemini-2.5-flash-lite-preview-09-2025", - "display_name": "gemini-2.5-flash-lite-preview-09-2025", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -5537,48 +5742,28 @@ }, "limit": { "context": 
1000000, - "output": 65536 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "knowledge": "2024-04", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.072, + "output": 0.287 }, "type": "chat" }, { - "id": "glm-for-coding", - "name": "glm-for-coding", - "display_name": "glm-for-coding", + "id": "qwen-math-turbo", + "name": "Qwen Math Turbo", + "display_name": "Qwen Math Turbo", "modalities": { "input": [ "text" @@ -5588,91 +5773,109 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-04", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.086, - "output": 0.343 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "claude-opus-4-5-20251101", - "display_name": "claude-opus-4-5-20251101", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, 
"temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 5, - "output": 25 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", + "cost": { + "input": 0.087, + "output": 0.345, + "input_audio": 5.448 + }, + "type": "chat" + }, + { + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -5682,65 +5885,79 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": true + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-26", - "last_updated": "2025-10-26", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.33, - "output": 1.32 + "input": 0.072, + "output": 0.287, + "reasoning": 0.717 }, "type": "chat" }, { - "id": "doubao-seed-code-preview-251028", - "name": "doubao-seed-code-preview-251028", - "display_name": "doubao-seed-code-preview-251028", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-11", - "last_updated": "2025-11-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.17, - "output": 1.14 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "glm-5", - "name": "glm-5", - "display_name": "glm-5", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -5750,8 +5967,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 202752, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -5772,18 +5989,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": 
"2026-04-14", + "last_updated": "2026-04-14", "cost": { - "input": 0.6, - "output": 2.6 + "input": 0.87, + "output": 3.48, + "cache_read": 0.17 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "glm-5-turbo", - "display_name": "glm-5-turbo", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -5793,8 +6011,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -5814,19 +6032,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.72, - "output": 3.2 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -5837,173 +6057,154 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.286, - "output": 1.142 + "input": 0.144, + "output": 1.434 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": 
"qwen3-235b-a22b-instruct-2507", - "display_name": "qwen3-235b-a22b-instruct-2507", + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.29, - "output": 1.143 + "input": 1.147, + "output": 4.588 }, "type": "chat" }, { - "id": "gpt-5.4-nano-2026-03-17", - "name": "gpt-5.4-nano-2026-03-17", - "display_name": "gpt-5.4-nano-2026-03-17", + "id": "qwen-plus-character", + "name": "Qwen Plus Character", + "display_name": "Qwen Plus Character", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.2, - "output": 1.25 + "input": 0.115, + "output": 0.287 }, "type": "chat" }, { - "id": 
"claude-sonnet-4-20250514", - "name": "claude-sonnet-4-20250514", - "display_name": "claude-sonnet-4-20250514", + "id": "kimi-k2-thinking", + "name": "Moonshot Kimi K2 Thinking", + "display_name": "Moonshot Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 3, - "output": 15 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "glm-4.5-x", - "display_name": "glm-4.5-x", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -6013,33 +6214,45 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - 
"knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.143, - "output": 2.29 + "input": 0.574, + "output": 2.294 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "gemini-3-pro-preview", - "display_name": "gemini-3-pro-preview", + "id": "qwen3.5-flash", + "name": "Qwen3.5 Flash", + "display_name": "Qwen3.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -6047,7 +6260,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -6058,67 +6271,76 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-04", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 2, - "output": 12 + "input": 0.172, + "output": 1.72, + "reasoning": 1.72 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "kimi-k2-0905-preview", - "display_name": "kimi-k2-0905-preview", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", 
+ "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 0.632, - "output": 2.53 + "input": 0.1875, + "output": 1.125, + "cache_write": 0.234375 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking-250715", - "name": "doubao-seed-1-6-thinking-250715", - "display_name": "doubao-seed-1-6-thinking-250715", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", @@ -6129,45 +6351,52 @@ ] }, "limit": { - "context": 256000, - "output": 16000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.121, - "output": 1.21 + "input": 2.294, + "output": 6.881 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -6182,232 +6411,154 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - 
"last_updated": "2026-03-19", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.6, - "output": 4.8 + "input": 0.143353, + "output": 1.433525, + "reasoning": 4.300576 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "claude-sonnet-4-5", - "display_name": "claude-sonnet-4-5", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", "cost": { - "input": 3, - "output": 15 + "input": 0.717, + "output": 0.717 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "gpt-5.4-mini", - "display_name": "gpt-5.4-mini", + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.75, - "output": 4.5 + "input": 0.101, + "output": 0.28 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "claude-opus-4-6", - "display_name": "claude-opus-4-6", + "id": "qwen-math-plus", + "name": "Qwen Math Plus", + "display_name": "Qwen Math Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 4096, + "output": 3072 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", + "knowledge": "2024-04", + "release_date": "2024-08-16", + "last_updated": "2024-09-19", "cost": { - "input": 5, - "output": 25 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "gpt-5.1-chat-latest", - "display_name": "gpt-5.1-chat-latest", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 16384, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.259, + "output": 0.775 }, "type": "chat" }, { - "id": "claude-opus-4-6-thinking", - "name": "claude-opus-4-6-thinking", - "display_name": 
"claude-opus-4-6-thinking", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -6415,7 +6566,7 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -6426,46 +6577,68 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-06", - "last_updated": "2026-03-13", - "cost": { - "input": 5, - "output": 25 + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0.573, + "output": 3.44, + "reasoning": 3.44 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "glm-4.5-airx", - "display_name": "glm-4.5-airx", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", + "cost": { + "input": 0.058, + "output": 0.23, + "input_audio": 3.584, + "output_audio": 7.168 
+ }, + "type": "chat" + }, + { + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -6475,8 +6648,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -6484,33 +6657,31 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.572, - "output": 1.714 + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "claude-sonnet-4-5-20250929-thinking", - "display_name": "claude-sonnet-4-5-20250929-thinking", + "id": "deepseek-r1-distill-qwen-7b", + "name": "DeepSeek R1 Distill Qwen 7B", + "display_name": "DeepSeek R1 Distill Qwen 7B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -6518,123 +6689,51 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15 + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "claude-opus-4-7", - "display_name": "claude-opus-4-7", + "id": "deepseek-v3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 0.574, + "output": 1.721 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "glm-4.5-air", - "display_name": "glm-4.5-air", + "id": "qwen2-5-coder-32b-instruct", + "name": "Qwen2.5-Coder 32B Instruct", + "display_name": "Qwen2.5-Coder 32B Instruct", "modalities": { "input": [ "text" @@ -6645,126 +6744,156 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2024-04", + "release_date": "2024-11", + "last_updated": "2024-11", "cost": { - "input": 0.1143, - "output": 0.286 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "gemini-3-pro-image-preview", - "display_name": "gemini-3-pro-image-preview", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 64000 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + 
"max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2, - "output": 120 + "input": 0.022, + "output": 0.216 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gpt-5-thinking", - "name": "gpt-5-thinking", - "display_name": "gpt-5-thinking", + "id": "deepseek-v3-2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.287, + "output": 0.431 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "grok-4-1-fast-reasoning", - "display_name": "grok-4-1-fast-reasoning", + "id": "moonshot-kimi-k2-instruct", + "name": "Moonshot Kimi K2 Instruct", + "display_name": "Moonshot Kimi K2 Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + 
"context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.574, + "output": 2.294 + }, + "type": "chat" + }, + { + "id": "deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -6772,26 +6901,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.144, + "output": 0.431 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-beta-0309", - "name": "grok-4.20-multi-agent-beta-0309", - "display_name": "grok-4.20-multi-agent-beta-0309", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", @@ -6802,8 +6925,8 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -6813,35 +6936,76 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.286705, + "output": 1.14682, + "reasoning": 2.867051 + }, + "type": "chat" + 
}, + { + "id": "qwen-deep-research", + "name": "Qwen Deep Research", + "display_name": "Qwen Deep Research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 2, - "output": 6 + "input": 7.742, + "output": 23.367 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothink", - "name": "gemini-2.5-flash-nothink", - "display_name": "gemini-2.5-flash-nothink", + "id": "kimi-k2.5", + "name": "Moonshot Kimi K2.5", + "display_name": "Moonshot Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -6852,49 +7016,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-06-24", - "last_updated": "2025-06-24", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.574, + "output": 2.411 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ - "text" + "text", + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -6914,128 +7070,124 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-10", - "last_updated": "2026-04-10", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.86, - "output": 3.5 + "input": 0.108, + "output": 0.431, + "reasoning": 1.076 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "gpt-4.1-nano", - "display_name": "gpt-4.1-nano", + "id": "deepseek-r1-distill-qwen-1-5b", + "name": "DeepSeek R1 Distill Qwen 1.5B", + "display_name": "DeepSeek R1 Distill Qwen 1.5B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - 
"last_updated": "2025-04-14", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "gemini-3.1-flash-image-preview", - "display_name": "gemini-3.1-flash-image-preview", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.5, - "output": 60 + "input": 0.345, + "output": 1.377 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen-Plus", - "display_name": "Qwen-Plus", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -7045,13 +7197,14 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -7065,66 +7218,69 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": 
"2026-02-12", "cost": { - "input": 0.12, + "input": 0.3, "output": 1.2 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", + "id": "qwen3-235b-a22b", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 2, - "output": 6 + "input": 0.287, + "output": 1.147, + "reasoning": 2.868 }, "type": "chat" - } - ] - }, - "nano-gpt": { - "id": "nano-gpt", - "name": "NanoGPT", - "display_name": "NanoGPT", - "api": "https://nano-gpt.com/api/v1", - "doc": "https://docs.nano-gpt.com", - "models": [ + }, { - "id": "learnlm-1.5-pro-experimental", - "name": "Gemini LearnLM Experimental", - "display_name": "Gemini LearnLM Experimental", + "id": "deepseek-r1-distill-llama-8b", + "name": "DeepSeek R1 Distill Llama 8B", + "display_name": "DeepSeek R1 Distill Llama 8B", "modalities": { "input": [ "text" @@ -7134,41 +7290,44 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 32768, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": 
true }, "attachment": false, "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3.502, - "output": 10.506 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking:8192", - "name": "Claude 4 Sonnet Thinking (8K)", - "display_name": "Claude 4 Sonnet Thinking (8K)", + "id": "kimi-k2.6", + "name": "Moonshot Kimi K2.6", + "display_name": "Moonshot Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -7177,38 +7336,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.929, + "output": 3.858 }, "type": "chat" }, { - "id": "mistral-code-latest", - "name": "Mistral Code Latest", - "display_name": "Mistral Code Latest", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -7218,27 +7368,29 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-06-02", - "last_updated": "2026-06-02", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.861, + "output": 3.441 }, "type": "chat" }, { - "id": "command-a-reasoning-08-2025", - "name": "Cohere Command A (08/2025)", - "display_name": "Cohere Command A (08/2025)", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ "text" @@ -7248,27 +7400,84 @@ ] }, "limit": { - "context": 256000, + "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, 
- "release_date": "2025-08-22", - "last_updated": "2025-08-22", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 2.5, - "output": 10 + "input": 0.23, + "output": 0.574 }, "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-v3-Derestricted-Lite", - "name": "Qwen3.5 27B BlueStar v3 Derestricted Lite", - "display_name": "Qwen3.5 27B BlueStar v3 Derestricted Lite", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.287, + "output": 0.861 + }, + "type": "chat" + }, + { + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", @@ -7281,9 +7490,10 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -7299,51 +7509,54 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.43, + "output": 2.58, + "reasoning": 2.58 }, "type": "chat" }, { - "id": "deepclaude", - "name": "DeepClaude", - "display_name": "DeepClaude", + "id": "tongyi-intent-detect-v3", + "name": "Tongyi Intent Detect V3", + "display_name": "Tongyi Intent Detect V3", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 128000, - "output": 8192 + "context": 8192, + "output": 1024 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 3, - "output": 15 + "input": 0.058, + "output": 0.144 }, "type": "chat" }, { - "id": "v0-1.5-lg", - "name": "v0 1.5 LG", - "display_name": "v0 1.5 LG", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -7354,26 +7567,28 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 15, - "output": 75 + "input": 0.144, + "output": 0.574 }, "type": "chat" }, { - "id": "Meta-Llama-3-1-8B-Instruct-FP8", - "name": "Llama 3.1 8B (decentralized)", - "display_name": "Llama 3.1 8B (decentralized)", + "id": "deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ "text" @@ -7383,42 +7598,43 @@ ] }, "limit": { - "context": 128000, + "context": 32768, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.02, - "output": 0.03 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - 
"id": "Qwen3.5-27B-Marvin-DPO-V2-Derestricted", - "name": "Qwen3.5 27B Marvin DPO V2 Derestricted", - "display_name": "Qwen3.5 27B Marvin DPO V2 Derestricted", + "id": "qwq-32b", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -7434,160 +7650,148 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.287, + "output": 0.861 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-06-17", - "name": "Gemini 2.5 Flash Lite Preview", - "display_name": "Gemini 2.5 Flash Lite Preview", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": 
true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.144, + "output": 0.574, + "reasoning": 1.434 }, "type": "chat" }, { - "id": "glm-4.1v-thinking-flashx", - "name": "GLM 4.1V Thinking FlashX", - "display_name": "GLM 4.1V Thinking FlashX", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 53248, + "output": 4096 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.032, + "output": 0.032 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Derestricted", - "name": "Qwen3.5 27B Derestricted", - "display_name": "Qwen3.5 27B Derestricted", + "id": "qwen-doc-turbo", + "name": "Qwen Doc Turbo", + "display_name": "Qwen Doc Turbo", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 0.306, - "output": 0.306 + 
"input": 0.087, + "output": 0.144 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001-thinking", - "name": "Claude Haiku 4.5 Thinking", - "display_name": "Claude Haiku 4.5 Thinking", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -7596,39 +7800,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1 + "input": 0.86, + "output": 3.15 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-1219", - "name": "Gemini 2.0 Flash Thinking 1219", - "display_name": "Gemini 2.0 Flash Thinking 1219", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -7638,27 +7831,53 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 131072, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, "open_weights": false, - "release_date": "2024-12-19", - "last_updated": "2024-12-19", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-07-15", "cost": { - "input": 0.1003, - "output": 0.408 + "input": 0.044, + "output": 0.087, + "reasoning": 0.431 }, "type": "chat" }, { - "id": "v0-1.0-md", - "name": "v0 1.0 MD", - "display_name": "v0 1.0 MD", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -7668,123 +7887,144 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 3, - "output": 15 + "input": 0.072, + "output": 0.144 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "open_weights": true, + "knowledge": "2024-04", + "release_date": 
"2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.287, + "output": 0.717 }, "type": "chat" }, { - "id": "gemma-4-31B-K1-v5", - "name": "Gemma 4 31B K1 v5", - "display_name": "Gemma 4 31B K1 v5", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 245800, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.32, + "output": 7.9, + "cache_read": 0.132 }, "type": "chat" }, { - "id": "glm-4-plus", - "name": "GLM-4 Plus", - "display_name": "GLM-4 Plus", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 7.497, - "output": 7.497 + "input": 0.115, + "output": 0.287 }, "type": "chat" }, { - "id": "auto-model-basic", - "name": "Auto model (Basic)", - "display_name": "Auto model (Basic)", 
+ "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -7792,26 +8032,60 @@ }, "limit": { "context": 1000000, - "output": 1000000 + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "jamba-large", - "name": "Jamba Large", - "display_name": "Jamba Large", + "id": "MiniMax/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -7821,27 +8095,42 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + 
"release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "kimi/kimi-k2.5", + "name": "kimi/kimi-k2.5", + "display_name": "kimi/kimi-k2.5", "modalities": { "input": [ "text", @@ -7853,12 +8142,14 @@ ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -7871,34 +8162,36 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.36, - "output": 2.88 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17:thinking", - "name": "Gemini 2.5 Flash Preview Thinking", - "display_name": "Gemini 2.5 Flash Preview Thinking", + "id": "siliconflow/deepseek-r1-0528", + "name": "siliconflow/deepseek-r1-0528", + "display_name": "siliconflow/deepseek-r1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 163840, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -7906,68 +8199,60 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, 
"visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 3.5 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "doubao-1.5-vision-pro-32k", - "name": "Doubao 1.5 Vision Pro 32k", - "display_name": "Doubao 1.5 Vision Pro 32k", + "id": "siliconflow/deepseek-v3.1-terminus", + "name": "siliconflow/deepseek-v3.1-terminus", + "display_name": "siliconflow/deepseek-v3.1-terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 163840, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.459, - "output": 1.377 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "hunyuan-turbos-20250226", - "name": "Hunyuan Turbo S", - "display_name": "Hunyuan Turbo S", + "id": "siliconflow/deepseek-v3-0324", + "name": "siliconflow/deepseek-v3-0324", + "display_name": "siliconflow/deepseek-v3-0324", "modalities": { "input": [ "text" @@ -7977,41 +8262,41 @@ ] }, "limit": { - "context": 24000, - "output": 8192 + "context": 163840, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0.187, - "output": 0.374 + "input": 0.25, 
+ "output": 1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", + "id": "siliconflow/deepseek-v3.2", + "name": "siliconflow/deepseek-v3.2", + "display_name": "siliconflow/deepseek-v3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, + "context": 163840, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -8019,38 +8304,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "gemini-2.0-flash-exp-image-generation", - "name": "Gemini Text + Image", - "display_name": "Gemini Text + Image", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -8060,32 +8330,32 @@ ] }, "limit": { - "context": 32767, - "output": 8192 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.2, - "output": 0.8 + "input": 1, + 
"output": 5 }, "type": "chat" }, { - "id": "hermes-high", - "name": "Hermes High", - "display_name": "Hermes High", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -8093,27 +8363,20 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 4.998, - "output": 25.007 + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "step-r1-v-mini", - "name": "Step R1 V Mini", - "display_name": "Step R1 V Mini", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ "text" @@ -8123,27 +8386,21 @@ ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", - "cost": { - "input": 2.5, - "output": 11 - }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20", - "name": "Gemini 2.5 Flash 0520", - "display_name": "Gemini 2.5 Flash 0520", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ "text", @@ -8154,126 +8411,74 @@ ] }, "limit": { - "context": 1048000, - "output": 65536 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": 
-1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", - "cost": { - "input": 0.15, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "sonar", - "name": "Perplexity Simple", - "display_name": "Perplexity Simple", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 127000, - "output": 128000 + "context": 34096, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 1.003, - "output": 1.003 - }, "type": "chat" }, { - "id": "yi-large", - "name": "Yi Large", - "display_name": "Yi Large", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 3.196, - "output": 3.196 - }, "type": "chat" }, { - "id": "Qwen3.5-27B-Omega-Evolution-v2.0-Derestricted-Lite", - "name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted Lite", - "display_name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted Lite", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + 
"context": 131072, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -8286,20 +8491,19 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", - "cost": { - "input": 0.306, - "output": 0.306 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "doubao-seed-2-0-code-preview-260215", - "name": "Doubao Seed 2.0 Code Preview", - "display_name": "Doubao Seed 2.0 Code Preview", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ "text" @@ -8309,62 +8513,24 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", - "cost": { - "input": 0.782, - "output": 3.893 - }, "type": "chat" }, { - "id": "ernie-4.5-turbo-128k", - "name": "Ernie 4.5 Turbo 128k", - "display_name": "Ernie 4.5 Turbo 128k", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", - "cost": { - "input": 0.132, - "output": 0.55 - }, - "type": "chat" - }, - { - "id": "gemini-2.0-flash-001", - "name": "Gemini 2.0 Flash", - 
"display_name": "Gemini 2.0 Flash", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" @@ -8372,265 +8538,238 @@ }, "limit": { "context": 1000000, - "output": 8192 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.1003, - "output": 0.408 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "type": "chat" }, { - "id": "Gemma-4-31B-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-09", - "last_updated": "2026-04-09", - "cost": { - "input": 0.306, - "output": 0.306 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "type": "chat" }, { - "id": 
"gemini-2.0-pro-exp-02-05", - "name": "Gemini 2.0 Pro 0205", - "display_name": "Gemini 2.0 Pro 0205", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2097152, + "context": 131072, "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", - "cost": { - "input": 1.989, - "output": 7.956 - }, + "attachment": false, "type": "chat" }, { - "id": "claw-high", - "name": "Claw High", - "display_name": "Claw High", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 1000000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 4.998, - "output": 25.007 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-1-thinking:32000", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", - "modalities": { - "input": [ - "text", - "image", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": 
"summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 14.994, - "output": 75.004 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "claude-opus-4-thinking:32768", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 Opus Thinking (32K)", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 14.994, - "output": 75.004 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "Gemma-4-31B-Claude-4.6-Opus-Reasoning-Distilled", - "name": "Gemma 4 31B Claude 4.6 Opus Reasoning Distilled", - "display_name": "Gemma 4 31B Claude 4.6 Opus Reasoning Distilled", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", - "cost": { - "input": 0.306, - "output": 0.306, - "cache_read": 0.0306 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "exa-research", - "name": "Exa (Research)", - "display_name": "Exa (Research)", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ "text" @@ -8640,32 +8779,108 @@ ] }, "limit": { - "context": 8192, + "context": 32768, "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "cost": { - "input": 2.5, - "output": 2.5 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, 
"type": "chat" }, { - "id": "Qwen3.5-27B-Omega-Evolution-v2.2-Derestricted-Lite", - "name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted Lite", - "display_name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted Lite", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ - "text", - "image", - "video" + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "type": "chat" + }, + { + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8000, + "output": 2000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "type": "chat" + }, + { + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, + "type": "chat" + }, + { + "id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", + "modalities": { + "input": [ + "text" ], "output": [ "text" @@ -8673,12 +8888,42 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": 
false, + "type": "chat" + }, + { + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true }, "extra_capabilities": { "reasoning": { @@ -8691,38 +8936,41 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", - "cost": { - "input": 0.306, - "output": 0.306 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "Qwen3.5-27B-Vivid-Durian", - "name": "Qwen3.5 27B Vivid Durian", - "display_name": "Qwen3.5 27B Vivid Durian", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -8735,20 +8983,13 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "attachment": false, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek Chat 0324", - "display_name": "DeepSeek Chat 0324", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -8758,58 +8999,45 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 
131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", - "cost": { - "input": 0.25, - "output": 0.7 - }, "type": "chat" }, { - "id": "azure-gpt-4o", - "name": "Azure gpt-4o", - "display_name": "Azure gpt-4o", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", - "cost": { - "input": 2.499, - "output": 9.996 - }, + "attachment": false, "type": "chat" }, { - "id": "ernie-x1-32k-preview", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -8819,27 +9047,38 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", - "cost": { - "input": 0.33, - "output": 1.32 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - 
"display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -8849,27 +9088,38 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.1, - "output": 0.4 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "doubao-seed-2-0-lite-260215", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -8879,233 +9129,246 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", - "cost": { - "input": 0.1462, - "output": 0.8738 - }, "type": "chat" }, { - "id": "gemini-2.5-pro-preview-06-05", - "name": "Gemini 2.5 Pro Preview 0605", - "display_name": "Gemini 2.5 Pro Preview 0605", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 
1.7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 32768, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "cost": { - "input": 2.5, - "output": 10 - }, + "attachment": false, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 5 - }, + "attachment": false, "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 262144, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-16", - "last_updated": "2025-06-16", - "cost": { - "input": 0.1394, - "output": 1.3328 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "command-a-plus-05-2026", - "name": "Cohere Command A+ (05/2026)", - "display_name": "Cohere Command A+ (05/2026)", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 131072, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-22", - "last_updated": "2026-05-22", - "cost": { - "input": 2.5, - "output": 10 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": false }, + "attachment": false, "type": "chat" - }, + } + ] + }, + "regolo-ai": { + "id": "regolo-ai", + "name": "Regolo AI", + "display_name": "Regolo AI", + "api": "https://api.regolo.ai/v1", + "doc": "https://docs.regolo.ai/", + "models": [ { - "id": "qwen3.7-plus:thinking", - "name": "Qwen3.7 Plus Thinking", - "display_name": "Qwen3.7 Plus Thinking", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983616, - "output": 65536 + "context": 120000, + "output": 120000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "release_date": "2025-04-07", + "last_updated": "2025-04-07", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "Baichuan-M2", - "name": "Baichuan M2 32B Medical", - "display_name": "Baichuan M2 32B Medical", + "id": "minimax-m2.5", + "name": "MiniMax 2.5", + "display_name": "MiniMax 2.5", "modalities": { "input": [ "text" @@ -9115,102 +9378,97 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 190000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 15.73, - "output": 15.73 
+ "input": 0.8, + "output": 3.5 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Infracelestial", - "name": "Qwen3.5 27B Infracelestial", - "display_name": "Qwen3.5 27B Infracelestial", + "id": "mistral-small3.2", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 120000, + "output": 120000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.5, + "output": 2.2 }, "type": "chat" }, { - "id": "asi1-mini", - "name": "ASI1 Mini", - "display_name": "ASI1 Mini", + "id": "qwen3-reranker-4b", + "name": "Qwen3-Reranker-4B", + "display_name": "Qwen3-Reranker-4B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 1, - "output": 1 + "input": 0.12, + "output": 0.12 }, - "type": "chat" + "type": "rerank" }, { - "id": "venice-uncensored", - "name": "Venice Uncensored", - "display_name": "Venice Uncensored", + "id": "qwen3-embedding-8b", + "name": "Qwen3-Embedding-8B", + 
"display_name": "Qwen3-Embedding-8B", "modalities": { "input": [ "text" @@ -9220,106 +9478,94 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.1, + "output": 0.1 }, - "type": "chat" + "type": "embedding" }, { - "id": "Qwen3.5-27B-NaNovel-Derestricted-Lite", - "name": "Qwen3.5 27B NaNovel Derestricted Lite", - "display_name": "Qwen3.5 27B NaNovel Derestricted Lite", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.6, + "output": 2.7 }, "type": "chat" }, { - "id": "glm-4-air", - "name": "GLM-4 Air", - "display_name": "GLM-4 Air", + "id": "qwen-image", + "name": "Qwen-Image", + "display_name": "Qwen-Image", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 4096 }, + "temperature": true, "tool_call": false, 
"reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.5, + "output": 2 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "Qwen3.5-27B-Writer-V2-Derestricted-Lite", - "name": "Qwen3.5 27B Writer V2 Derestricted Lite", - "display_name": "Qwen3.5 27B Writer V2 Derestricted Lite", + "id": "qwen3.5-122b", + "name": "Qwen3.5-122B", + "display_name": "Qwen3.5-122B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -9329,7 +9575,8 @@ "context": 262144, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -9346,71 +9593,56 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.9, + "output": 3.6 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", - "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "id": "gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - 
"visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1, + "output": 4.2 }, "type": "chat" }, { - "id": "venice-uncensored:web", - "name": "Venice Uncensored Web", - "display_name": "Venice Uncensored Web", + "id": "qwen3-coder-next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ "text" @@ -9420,126 +9652,155 @@ ] }, "limit": { - "context": 80000, + "context": 262144, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-05-01", - "last_updated": "2024-05-01", + "open_weights": true, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "deepseek-r1-sambanova", - "name": "DeepSeek R1 Fast", - "display_name": "DeepSeek R1 Fast", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + 
"open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 4.998, - "output": 6.987 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "Gemma-4-31B-GarnetV2", - "name": "Gemma 4 31B Garnet V2", - "display_name": "Gemma 4 31B Garnet V2", + "id": "mistral-small-4-119b", + "name": "Mistral Small 4 119B", + "display_name": "Mistral Small 4 119B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 256000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.75, + "output": 3 }, "type": "chat" }, { - "id": "holo3-35b-a3b:thinking", - "name": "Holo3-35B-A3B Thinking", - "display_name": "Holo3-35B-A3B Thinking", + "id": "gpt-oss-20b", + "name": "GPT-OSS-20B", + "display_name": "GPT-OSS-20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.25, + "input": 0.4, "output": 1.8 }, "type": "chat" - }, + } + ] + }, + "stackit": { + "id": "stackit", + "name": "STACKIT", + "display_name": "STACKIT", + "api": "https://api.openai-compat.model-serving.eu01.onstackit.cloud/v1", + "doc": 
"https://docs.stackit.cloud/products/data-and-ai/ai-model-serving/basics/available-shared-models", + "models": [ { - "id": "kimi-thinking-preview", - "name": "Kimi Thinking Preview", - "display_name": "Kimi Thinking Preview", + "id": "neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -9547,26 +9808,27 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 31.46, - "output": 31.46 + "input": 0.16, + "output": 0.27 }, "type": "chat" }, { - "id": "Baichuan4-Turbo", - "name": "Baichuan 4 Turbo", - "display_name": "Baichuan 4 Turbo", + "id": "neuralmagic/Mistral-Nemo-Instruct-2407-FP8", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -9577,26 +9839,27 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "open_weights": true, + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2.42, - "output": 2.42 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "glm-4-long", - "name": "GLM-4 Long", - "display_name": "GLM-4 Long", + "id": "cortecs/Llama-3.3-70B-Instruct-FP8-Dynamic", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -9606,145 +9869,124 @@ ] }, "limit": { - "context": 1000000, - "output": 4096 + 
"context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "open_weights": true, + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "brave", - "name": "Brave (Answers)", - "display_name": "Brave (Answers)", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 37000, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-05-17", + "last_updated": "2025-05-17", "cost": { - "input": 5, - "output": 5 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Musica-v1", - "name": "Qwen3.5 27B Musica v1", - "display_name": "Qwen3.5 27B Musica v1", + "id": "Qwen/Qwen3-VL-Embedding-8B", + "name": "Qwen3-VL Embedding 8B", + "display_name": "Qwen3-VL Embedding 8B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 32000, + "output": 4096 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + 
"open_weights": true, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.09, + "output": 0.09 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Writer-V2-Derestricted", - "name": "Qwen3.5 27B Writer V2 Derestricted", - "display_name": "Qwen3.5 27B Writer V2 Derestricted", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct-FP8", + "name": "Qwen3-VL 235B", + "display_name": "Qwen3-VL 235B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 218000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "open_weights": true, + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.64, + "output": 1.91 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Perplexity Pro", - "display_name": "Perplexity Pro", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -9754,27 +9996,34 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": 
"2025-08-05", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.49, + "output": 0.71 }, "type": "chat" }, { - "id": "glm-4", - "name": "GLM-4", - "display_name": "GLM-4", + "id": "intfloat/e5-mistral-7b-instruct", + "name": "E5 Mistral 7B", + "display_name": "E5 Mistral 7B", "modalities": { "input": [ "text" @@ -9784,87 +10033,106 @@ ] }, "limit": { - "context": 128000, + "context": 4096, "output": 4096 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-16", - "last_updated": "2024-01-16", + "open_weights": true, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 14.994, - "output": 14.994 + "input": 0.02, + "output": 0.02 }, "type": "chat" - }, + } + ] + }, + "vercel": { + "id": "vercel", + "name": "Vercel AI Gateway", + "display_name": "Vercel AI Gateway", + "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", + "models": [ { - "id": "doubao-seed-1-8-251215", - "name": "Doubao Seed 1.8", - "display_name": "Doubao Seed 1.8", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.612, - "output": 6.12 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "Qwen2.5-32B-EVA-v0.2", - "name": "Qwen 2.5 32b EVA", - "display_name": "Qwen 2.5 
32b EVA", + "id": "xai/grok-4.20-non-reasoning-beta", + "name": "Grok 4.20 Beta Non-Reasoning", + "display_name": "Grok 4.20 Beta Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 24576, - "output": 8192 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.493, - "output": 0.493 + "input": 1.25, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "claw-low", - "name": "Claw Low", - "display_name": "Claw Low", + "id": "xai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", @@ -9876,29 +10144,35 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 1000000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", + "release_date": "2026-04-30", + "last_updated": "2026-04-17", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude 4 Opus", - "display_name": "Claude 4 Opus", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok 4.1 Fast Non-Reasoning", + "display_name": "Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ "text", @@ -9910,345 +10184,325 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 1000000 }, + "temperature": true, "tool_call": true, "reasoning": { - 
"supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "knowledge": "2024-10", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "Qwen3.5-27B-NaNovel-Derestricted", - "name": "Qwen3.5 27B NaNovel Derestricted", - "display_name": "Qwen3.5 27B NaNovel Derestricted", + "id": "xai/grok-imagine-video", + "name": "Grok Imagine", + "display_name": "Grok Imagine", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": 
"Magistral Small 2506", + "id": "xai/grok-4.20-multi-agent-beta", + "name": "Grok 4.20 Multi Agent Beta", + "display_name": "Grok 4.20 Multi Agent Beta", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.4, - "output": 1.4 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Queen-Derestricted-Lite", - "name": "Qwen3.5 27B Queen Derestricted Lite", - "display_name": "Qwen3.5 27B Queen Derestricted Lite", + "id": "xai/grok-4.20-reasoning", + "name": "Grok 4.20 Reasoning", + "display_name": "Grok 4.20 Reasoning", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "xai/grok-4.20-reasoning-beta", + "name": "Grok 4.20 Beta Reasoning", 
+ "display_name": "Grok 4.20 Beta Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 65536 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-03-11", + "last_updated": "2026-03-13", "cost": { - "input": 0.4, - "output": 1.7 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "exa-answer", - "name": "Exa (Answer)", - "display_name": "Exa (Answer)", + "id": "xai/grok-imagine-video-1.5-preview", + "name": "Grok Imagine Video 1.5 Preview", + "display_name": "Grok Imagine Video 1.5 Preview", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", - "cost": { - "input": 2.5, - "output": 2.5 - }, + "release_date": "2026-05-30", + "last_updated": "2026-05-30", "type": "chat" }, { - "id": "doubao-1.5-pro-256k", - "name": "Doubao 1.5 Pro 256k", - "display_name": "Doubao 1.5 Pro 256k", + "id": "xai/grok-4.20-non-reasoning", + "name": "Grok 4.20 Non-Reasoning", + "display_name": "Grok 4.20 Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 2000000, + "output": 2000000 }, - 
"tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.799, - "output": 1.445 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gemma-4-31B-Larkspur-v0.5", - "name": "Gemma 4 31B Larkspur v0.5", - "display_name": "Gemma 4 31B Larkspur v0.5", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 2000000, + "output": 2000000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", + "release_date": "2026-03-09", + "last_updated": "2026-03-23", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen3.5-flash:thinking", - "name": "Qwen3.5 Flash Thinking", - "display_name": "Qwen3.5 Flash Thinking", + "id": "xai/grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ + "text" + ], + "output": [ "text", - "image", - "video" + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-01-28", + "last_updated": "2026-02-19", + "type": "chat" + }, + { + "id": "xai/grok-build-0.1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", + "modalities": { + 
"input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 991808, - "output": 65536 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2026-05-20", + "last_updated": "2026-04-16", "cost": { - "input": 0.09, - "output": 0.36 + "input": 1, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "KAT-Coder-Exp-72B-1010", - "name": "KAT Coder Exp 72B 1010", - "display_name": "KAT Coder Exp 72B 1010", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -10258,27 +10512,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.57, + "output": 2.3 }, "type": "chat" }, { - "id": "exa-research-pro", - "name": "Exa (Research Pro)", - "display_name": "Exa (Research Pro)", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -10288,27 +10543,42 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262114, + "output": 262114 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": 
true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "ernie-4.5-turbo-vl-32k", - "name": "Ernie 4.5 Turbo VL 32k", - "display_name": "Ernie 4.5 Turbo VL 32k", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -10319,27 +10589,42 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 262114, + "output": 262114 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-26", + "last_updated": "2026-01", "cost": { - "input": 0.495, - "output": 1.43 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:32000", - "name": "Claude 4 Opus Thinking (32K)", - "display_name": "Claude 4 Opus Thinking (32K)", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -10351,9 +10636,10 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ 
-10361,380 +10647,298 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "supported": true } }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct-original", - "name": "Qwen3 VL 235B A22B Instruct Original", - "display_name": "Qwen3 VL 235B A22B Instruct Original", + "id": "klingai/kling-v3.0-motion-control", + "name": "Kling v3.0 Motion Control", + "display_name": "Kling v3.0 Motion Control", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", - "cost": { - "input": 0.5, - "output": 1.2 - }, + "release_date": "2026-03-04", + "last_updated": "2026-03-04", "type": "chat" }, { - "id": "yi-lightning", - "name": "Yi Lightning", - "display_name": "Yi Lightning", + "id": "klingai/kling-v2.6-i2v", + "name": "Kling v2.6 Image-to-Video", + "display_name": "Kling v2.6 Image-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 
12000, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10-16", - "last_updated": "2024-10-16", - "cost": { - "input": 0.2006, - "output": 0.2006 - }, + "release_date": "2025-12-21", + "last_updated": "2025-12-21", "type": "chat" }, { - "id": "azure-o1", - "name": "Azure o1", - "display_name": "Azure o1", + "id": "klingai/kling-v2.5-turbo-t2v", + "name": "Kling v2.5 Turbo Text-to-Video", + "display_name": "Kling v2.5 Turbo Text-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", - "cost": { - "input": 14.994, - "output": 59.993 - }, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "type": "chat" }, { - "id": "mirothinker-1-7-deepresearch-mini", - "name": "MiroThinker 1.7 Deep Research Mini", - "display_name": "MiroThinker 1.7 Deep Research Mini", + "id": "klingai/kling-v3.0-i2v", + "name": "Kling v3.0 Image-to-Video", + "display_name": "Kling v3.0 Image-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 1.25, - "output": 10 - }, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "type": "chat" }, { - "id": "mistral-code-agent-latest", - "name": "Mistral Code Agent Latest", - "display_name": "Mistral Code Agent 
Latest", + "id": "klingai/kling-v2.5-turbo-i2v", + "name": "Kling v2.5 Turbo Image-to-Video", + "display_name": "Kling v2.5 Turbo Image-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-06-02", - "last_updated": "2026-06-02", - "cost": { - "input": 0.4, - "output": 2 - }, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "type": "chat" }, { - "id": "Gemma-4-31B-DarkIdol", - "name": "Gemma 4 31B DarkIdol", - "display_name": "Gemma 4 31B DarkIdol", + "id": "klingai/kling-v3.0-t2v", + "name": "Kling v3.0 Text-to-Video", + "display_name": "Kling v3.0 Text-to-Video", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "type": "chat" }, { - "id": "jamba-mini-1.6", - "name": "Jamba Mini 1.6", - "display_name": "Jamba Mini 1.6", + "id": "klingai/kling-v2.6-motion-control", + "name": "Kling v2.6 Motion Control", + "display_name": "Kling v2.6 Motion Control", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-01", 
- "last_updated": "2025-03-01", - "cost": { - "input": 0.1989, - "output": 0.408 - }, + "release_date": "2025-12-21", + "last_updated": "2025-12-21", "type": "chat" }, { - "id": "hermes-low", - "name": "Hermes Low", - "display_name": "Hermes Low", + "id": "klingai/kling-v2.6-t2v", + "name": "Kling v2.6 Text-to-Video", + "display_name": "Kling v2.6 Text-to-Video", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025 - }, + "release_date": "2025-12-21", + "last_updated": "2025-12-21", "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-Derestricted", - "name": "Qwen3.5 27B BlueStar Derestricted", - "display_name": "Qwen3.5 27B BlueStar Derestricted", + "id": "voyage/voyage-4-lite", + "name": "voyage-4-lite", + "display_name": "voyage-4-lite", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 32000, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - 
"id": "Qwen3.5-27B-Marvin-V2-Derestricted-Lite", - "name": "Qwen3.5 27B Marvin V2 Derestricted Lite", - "display_name": "Qwen3.5 27B Marvin V2 Derestricted Lite", + "id": "voyage/voyage-law-2", + "name": "voyage-law-2", + "display_name": "voyage-law-2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2024-03-01", + "last_updated": "2024-03", "type": "chat" }, { - "id": "ernie-x1-32k", - "name": "Ernie X1 32k", - "display_name": "Ernie X1 32k", + "id": "voyage/voyage-4", + "name": "voyage-4", + "display_name": "voyage-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -10742,132 +10946,77 @@ }, "limit": { "context": 32000, - "output": 16384 + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", - "cost": { - "input": 0.33, - "output": 1.32 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "claude-sonnet-4-thinking:1024", - "name": "Claude 4 Sonnet Thinking (1K)", - "display_name": "Claude 4 Sonnet Thinking (1K)", + "id": "voyage/voyage-code-3", + "name": "voyage-code-3", + "display_name": "voyage-code-3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], 
"output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 1536 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 2.992, - "output": 14.994 - }, + "release_date": "2024-09-01", + "last_updated": "2024-09", "type": "chat" }, { - "id": "gemini-2.5-flash-preview-04-17", - "name": "Gemini 2.5 Flash Preview", - "display_name": "Gemini 2.5 Flash Preview", + "id": "voyage/voyage-4-large", + "name": "voyage-4-large", + "display_name": "voyage-4-large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 32000, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", - 
"cost": { - "input": 0.15, - "output": 0.6 - }, + "release_date": "2026-03-06", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "hermes-medium", - "name": "Hermes Medium", - "display_name": "Hermes Medium", + "id": "voyage/rerank-2.5", + "name": "Voyage Rerank 2.5", + "display_name": "Voyage Rerank 2.5", "modalities": { "input": [ "text" @@ -10877,250 +11026,159 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32000, + "output": 32000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 0.3, - "output": 1.2 - }, + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "type": "chat" }, { - "id": "Qwen3.5-27B-Marvin-DPO-V2-Derestricted-Lite", - "name": "Qwen3.5 27B Marvin DPO V2 Derestricted Lite", - "display_name": "Qwen3.5 27B Marvin DPO V2 Derestricted Lite", + "id": "voyage/rerank-2.5-lite", + "name": "Voyage Rerank 2.5 Lite", + "display_name": "Voyage Rerank 2.5 Lite", "modalities": { "input": [ - "text", - "image", - "video" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 262144, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0.306, - "output": 0.306 - }, - "type": "chat" - }, - { - "id": "gemma-4-31B-MeroMero", - "name": "Gemma 4 31B MeroMero", - "display_name": "Gemma 4 31B MeroMero", - "modalities": { - "input": [ - "text", - "image", - "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - 
"output": 16384 + "context": 32000, + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "type": "chat" }, { - "id": "ernie-5.0-thinking-preview", - "name": "Ernie 5.0 Thinking Preview", - "display_name": "Ernie 5.0 Thinking Preview", + "id": "voyage/voyage-code-2", + "name": "voyage-code-2", + "display_name": "voyage-code-2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", - "cost": { - "input": 1.1, - "output": 2 - }, + "release_date": "2024-01-01", + "last_updated": "2024-01", "type": "chat" }, { - "id": "Gemma-4-31B-Queen", - "name": "Gemma 4 31B Queen", - "display_name": "Gemma 4 31B Queen", + "id": "voyage/voyage-3.5-lite", + "name": "voyage-3.5-lite", + "display_name": "voyage-3.5-lite", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": 
"2025-05-20", + "last_updated": "2025-05-20", "type": "chat" }, { - "id": "kimi-k2-instruct-fast", - "name": "Kimi K2 0711 Fast", - "display_name": "Kimi K2 0711 Fast", + "id": "voyage/voyage-3.5", + "name": "voyage-3.5", + "display_name": "voyage-3.5", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", - "cost": { - "input": 0.1, - "output": 2 - }, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "type": "chat" }, { - "id": "Qwen3.5-27B-Queen-Derestricted", - "name": "Qwen3.5 27B Queen Derestricted", - "display_name": "Qwen3.5 27B Queen Derestricted", + "id": "voyage/voyage-3-large", + "name": "voyage-3-large", + "display_name": "voyage-3-large", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2024-09-01", + "last_updated": "2024-09", "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "voyage/voyage-finance-2", + "name": "voyage-finance-2", + "display_name": "voyage-finance-2", "modalities": { "input": [ "text" @@ -11130,133 
+11188,83 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.4, - "output": 1.7 - }, + "release_date": "2024-03-01", + "last_updated": "2024-03", "type": "chat" }, { - "id": "gemini-2.5-pro-preview-05-06", - "name": "Gemini 2.5 Pro Preview 0506", - "display_name": "Gemini 2.5 Pro Preview 0506", + "id": "mistral/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2025-05-06", + "knowledge": "2024-04", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "qwen3.5-flash", - "name": "Qwen3.5 Flash", - "display_name": "Qwen3.5 Flash", + "id": "mistral/codestral-embed", + "name": "Codestral Embed", + "display_name": 
"Codestral Embed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 991808, - "output": 65536 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", - "cost": { - "input": 0.09, - "output": 0.36 - }, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "type": "chat" }, { - "id": "phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "mistral/mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ "text" @@ -11266,27 +11274,24 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", - "cost": { - "input": 0.07, - "output": 0.11 - }, + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "mistral/devstral-small", + "name": "Devstral Small 1.1", + "display_name": "Devstral Small 1.1", "modalities": { "input": [ "text" @@ -11296,63 +11301,62 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, 
"open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.25 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "azure-gpt-4-turbo", - "name": "Azure gpt-4-turbo", - "display_name": "Azure gpt-4-turbo", + "id": "mistral/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "knowledge": "2024-10", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 9.996, - "output": 30.005 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Reasoning Pro", - "display_name": "Perplexity Reasoning Pro", + "id": "mistral/mistral-medium-3.5", + "name": "Mistral Medium Latest", + "display_name": "Mistral Medium Latest", "modalities": { "input": [ "text" @@ -11362,28 +11366,29 @@ ] }, "limit": { - "context": 127000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 2.006, - "output": 7.9985 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "mistral/mistral-medium", + "name": 
"Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text", @@ -11394,47 +11399,29 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 2.5, - "output": 10 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "KAT-Coder-Air-V1", - "name": "KAT Coder Air V1", - "display_name": "KAT Coder Air V1", + "id": "mistral/devstral-small-2", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ "text" @@ -11444,57 +11431,63 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "knowledge": "2024-10", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { "input": 0.1, - "output": 0.2 + "output": 0.3 }, "type": "chat" }, { - "id": "glm-4-air-0111", - "name": "GLM 4 Air 0111", - "display_name": "GLM 4 Air 0111", + "id": "mistral/ministral-14b", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - 
"context": 128000, - "output": 4096 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-11", - "last_updated": "2025-01-11", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.1394, - "output": 0.1394 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "mistral/devstral-2", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -11504,63 +11497,65 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-22", - "last_updated": "2025-01-22", + "knowledge": "2024-10", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.1343, - "output": 0.3349 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "qwen3.5-omni-plus", - "name": "Qwen3.5 Omni Plus", - "display_name": "Qwen3.5 Omni Plus", + "id": "mistral/ministral-8b", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983616, - "output": 65536 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - 
"input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "doubao-seed-1-6-flash-250615", - "name": "Doubao Seed 1.6 Flash", - "display_name": "Doubao Seed 1.6 Flash", + "id": "mistral/mistral-small", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -11568,26 +11563,29 @@ }, "limit": { "context": 256000, - "output": 16384 + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.0374, - "output": 0.374 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "mirothinker-1-7-deepresearch", - "name": "MiroThinker 1.7 Deep Research", - "display_name": "MiroThinker 1.7 Deep Research", + "id": "mistral/codestral", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ "text" @@ -11597,148 +11595,130 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 4, - "output": 25 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "azure-o3-mini", - "name": "Azure o3-mini", - "display_name": "Azure o3-mini", + "id": "mistral/pixtral-12b", + "name": "Pixtral 12B", + "display_name": 
"Pixtral 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "attachment": true, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 1.088, - "output": 4.3996 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "mistral/pixtral-large", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "mistral/ministral-3b", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.8, - "output": 4 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "DeepSeek V3/Deepseek Chat", - "display_name": "DeepSeek V3/Deepseek Chat", + "id": "mistral/magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -11746,58 +11726,62 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 0.25, - "output": 0.7 + "input": 0.5, + 
"output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.0-flash-thinking-exp-01-21", - "name": "Gemini 2.0 Flash Thinking 0121", - "display_name": "Gemini 2.0 Flash Thinking 0121", + "id": "mistral/magistral-medium", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-21", - "last_updated": "2025-01-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", "cost": { - "input": 0.306, - "output": 1.003 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "phi-4-mini-instruct", - "name": "Phi 4 Mini", - "display_name": "Phi 4 Mini", + "id": "google/gemini-embedding-2", + "name": "Gemini Embedding 2", + "display_name": "Gemini Embedding 2", "modalities": { "input": [ "text" @@ -11807,27 +11791,24 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", - "cost": { - "input": 0.17, - "output": 0.68 - }, + "release_date": "2026-03-10", + "last_updated": "2026-03-23", "type": "chat" }, { - "id": "claw-medium", - "name": "Claw Medium", - "display_name": "Claw Medium", + "id": "google/text-multilingual-embedding-002", + "name": "Text Multilingual Embedding 002", + "display_name": "Text Multilingual Embedding 002", "modalities": { "input": [ "text" @@ -11837,192 +11818,191 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 1536 }, 
- "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-11", - "last_updated": "2026-05-11", - "cost": { - "input": 0.3, - "output": 1.2 - }, + "release_date": "2024-03-01", + "last_updated": "2024-03", "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-v2-Derestricted", - "name": "Qwen3.5 27B BlueStar v2 Derestricted", - "display_name": "Qwen3.5 27B BlueStar v2 Derestricted", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 65000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.25, + "output": 1.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "google/gemini-3.1-flash-image", + "name": "Gemini 3.1 Flash Image (Nano Banana 2)", + "display_name": "Gemini 3.1 Flash Image (Nano Banana 2)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": 
false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen3.5-omni-flash", - "name": "Qwen3.5 Omni Flash", - "display_name": "Qwen3.5 Omni Flash", + "id": "google/gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 49152, - "output": 16384 + "context": 1000000, + "output": 65000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "knowledge": "2025-03", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0 + "input": 0.5, 
+ "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen 2.5 Max", - "display_name": "Qwen 2.5 Max", + "id": "google/veo-3.1-generate-001", + "name": "Veo 3.1", + "display_name": "Veo 3.1", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 32000, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", - "cost": { - "input": 1.5997, - "output": 6.392 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "doubao-1-5-thinking-pro-250415", - "name": "Doubao 1.5 Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "google/gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -12030,117 +12010,138 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2025-04-17", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0.6, - "output": 2.4 + "input": 1.5, + "output": 9, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "jamba-large-1.7", - "name": "Jamba Large 1.7", - "display_name": "Jamba Large 1.7", + "id": 
"google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "brave-pro", - "name": "Brave (Pro)", - "display_name": "Brave (Pro)", + "id": "google/veo-3.0-generate-001", + "name": "Veo 3.0", + "display_name": "Veo 3.0", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", - "cost": { - "input": 5, - "output": 5 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "jamba-mini-1.7", - "name": "Jamba Mini 1.7", - "display_name": "Jamba Mini 1.7", + "id": "google/veo-3.0-fast-generate-001", + "name": "Veo 3.0 Fast Generate", + "display_name": "Veo 3.0 Fast Generate", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", - "cost": { - "input": 0.1989, - "output": 0.408 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", 
"type": "chat" }, { - "id": "sarvam-105b", - "name": "Sarvam 105B", - "display_name": "Sarvam 105B", + "id": "google/text-embedding-005", + "name": "Text Embedding 005", + "display_name": "Text Embedding 005", "modalities": { "input": [ "text" @@ -12150,29 +12151,24 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 8192, + "output": 1536 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", - "cost": { - "input": 0.045, - "output": 0.177, - "cache_read": 0.028 - }, + "release_date": "2024-08-01", + "last_updated": "2024-08", "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0 1.5 MD", - "display_name": "v0 1.5 MD", + "id": "google/gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -12182,71 +12178,102 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-04", - "last_updated": "2025-07-04", - "cost": { - "input": 3, - "output": 15 - }, - "type": "chat" + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "type": "embedding" }, { - "id": "glm-zero-preview", - "name": "GLM Zero Preview", - "display_name": "GLM Zero Preview", + "id": "google/gemini-2.5-flash-image", + "name": "Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Nano Banana (Gemini 2.5 Flash Image)", "modalities": { "input": [ "text" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 32768, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": 
false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-08-26", "cost": { - "input": 1.802, - "output": 1.802 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.5-flash-lite", + "id": "google/imagen-4.0-fast-generate-001", + "name": "Imagen 4 Fast", + "display_name": "Imagen 4 Fast", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-01", + "last_updated": "2025-06", + "type": "imageGeneration" + }, + { + "id": "google/gemini-2.5-flash-lite", "name": "Gemini 2.5 Flash Lite", "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, + "context": 1048576, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": false @@ -12272,64 +12299,104 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2025-06-17", "last_updated": "2025-06-17", "cost": { "input": 0.1, - "output": 0.4 + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "sarvam-30b", - "name": "Sarvam 30B", - "display_name": "Sarvam 30B", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 65536, - "output": 4096 + "context": 131072, + "output": 32768 }, - "tool_call": true, + "temperature": true, + 
"tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "knowledge": "2025-01", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.028, - "output": 0.111, - "cache_read": 0.017 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "google/imagen-4.0-ultra-generate-001", + "name": "Imagen 4 Ultra", + "display_name": "Imagen 4 Ultra", "modalities": { "input": [ - "text", + "text" + ], + "output": [ "image" + ] + }, + "limit": { + "context": 480, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", + "type": "imageGeneration" + }, + { + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -12338,15 +12405,12 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ @@ -12356,126 +12420,203 @@ }, "attachment": true, "open_weights": false, - "release_date": 
"2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2026-02-19", "cost": { - "input": 0.3, - "output": 2.5 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "azure-gpt-4o-mini", - "name": "Azure gpt-4o-mini", - "display_name": "Azure gpt-4o-mini", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "qwen3.5-35b-a3b", - "name": "Qwen3.5 35B A3B", - "display_name": "Qwen3.5 35B A3B", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": 
"2026-02-24", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.225, - "output": 1.8 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "ernie-5.1:thinking", - "name": "ERNIE 5.1 Thinking", - "display_name": "ERNIE 5.1 Thinking", + "id": "google/veo-3.1-fast-generate-001", + "name": "Veo 3.1 Fast Generate", + "display_name": "Veo 3.1 Fast Generate", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ + "video" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", + "type": "chat" + }, + { + "id": "google/gemini-3-pro-image", + "name": "Nano Banana Pro (Gemini 3 Pro Image)", + "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", + "modalities": { + "input": [ "text" + ], + "output": [ + "text", + "image" ] }, "limit": { - "context": 119000, - "output": 64000 + "context": 65536, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-05-10", - "last_updated": "2026-05-10", + "knowledge": "2025-03", + "release_date": "2025-09-01", + "last_updated": "2025-09", "cost": { - "input": 0.75, - "output": 3, - 
"cache_read": 0.75 + "input": 2, + "output": 12, + "cache_read": 0.2 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-sonnet-4-thinking:64000", - "name": "Claude 4 Sonnet Thinking (64K)", - "display_name": "Claude 4 Sonnet Thinking (64K)", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", @@ -12488,8 +12629,9 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -12497,106 +12639,117 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.25, + "output": 1.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "deepseek-reasoner-cheaper", - "name": "Deepseek R1 Cheaper", - "display_name": "Deepseek R1 Cheaper", + "id": "google/imagen-4.0-generate-001", + "name": "Imagen 4", + "display_name": "Imagen 4", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 480, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.4, - "output": 1.7 - }, - "type": "chat" + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "type": "imageGeneration" }, { - "id": "Gemma-4-31B-Gemopus", - "name": "Gemma 4 31B Gemopus", - "display_name": "Gemma 4 31B Gemopus", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", 
- "last_updated": "2026-05-01", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Preview (09/2025)", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -12604,9 +12757,10 @@ ] }, "limit": { - "context": 1048756, + "context": 1048576, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -12619,10 +12773,9 @@ "mode": "budget", "budget": { "default": -1, - "min": 0, - "max": 24576, + "min": 128, + "max": 32768, "auto": -1, - "off": 0, "unit": "tokens" }, "summaries": true, @@ -12634,115 +12787,134 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.3, - "output": 2.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "auto-model-standard", - "name": "Auto model (Standard)", - "display_name": "Auto model (Standard)", + "id": "prodia/flux-fast-schnell", + "name": "Flux Schnell", + "display_name": "Flux Schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": 
false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", - "cost": { - "input": 9.996, - "output": 19.992 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "Gemma-4-31B-Musica-v1", - "name": "Gemma 4 31B Musica v1", - "display_name": "Gemma 4 31B Musica v1", + "id": "openai/gpt-oss-safeguard-20b", + "name": "gpt-oss-safeguard-20b", + "display_name": "gpt-oss-safeguard-20b", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "mistral-small-31-24b-instruct", - "name": "Mistral Small 31 24b Instruct", - "display_name": "Mistral Small 31 24b Instruct", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 8192, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2021-09", + "release_date": "2023-09-28", + "last_updated": "2023-03-01", "cost": { - "input": 0.1, - "output": 0.3 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.0-pro-reasoner", - "name": "Gemini 2.0 
Pro Reasoner", - "display_name": "Gemini 2.0 Pro Reasoner", + "id": "openai/gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -12750,26 +12922,30 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "knowledge": "2024-10", + "release_date": "2025-12-11", + "last_updated": "2025-08-07", "cost": { - "input": 1.292, - "output": 4.998 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "glm-z1-air", - "name": "GLM Z1 Air", - "display_name": "GLM Z1 Air", + "id": "openai/text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -12779,68 +12955,79 @@ ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 8192, + "output": 1536 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.07, - "output": 0.07 - }, - "type": "chat" + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "type": "embedding" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 ", + "display_name": "GPT 5.2 ", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + 
"supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2024-10", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.04998, - "output": 0.2006 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "fastgpt", - "name": "Web Answer", - "display_name": "Web Answer", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT 4o Mini Search Preview", + "display_name": "GPT 4o Mini Search Preview", "modalities": { "input": [ "text" @@ -12850,102 +13037,98 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2023-08-01", - "last_updated": "2024-01-01", + "knowledge": "2023-09", + "release_date": "2025-03-12", + "last_updated": "2025-01", "cost": { - "input": 7.5, - "output": 7.5 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "gemini-exp-1206", - "name": "Gemini 2.0 Pro 1206", - "display_name": "Gemini 2.0 Pro 1206", + "id": "openai/gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 2097152, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.258, - "output": 4.998 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen3.5-27B-earica-Derestricted-Lite", - "name": "Qwen3.5 27B earica Derestricted Lite", - "display_name": "Qwen3.5 27B earica Derestricted Lite", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 16385, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2021-09", + "release_date": "2023-05-28", + "last_updated": "2023-11-06", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-nothinking", - "name": "Gemini 2.5 Flash (No Thinking)", - "display_name": "Gemini 2.5 Flash (No Thinking)", + "id": "openai/gpt-5-pro", + "name": "GPT-5 pro", + "display_name": "GPT-5 pro", "modalities": { "input": [ "text", @@ -12953,14 +13136,16 @@ "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 400000, + "output": 272000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ 
-12969,51 +13154,48 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", + "knowledge": "2024-10", + "release_date": "2025-08-07", + "last_updated": "2025-10-06", "cost": { - "input": 0.3, - "output": 2.5 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Anko", - "name": "Qwen3.5 27B Anko", - "display_name": "Qwen3.5 27B Anko", + "id": "openai/o3-pro", + "name": "o3 Pro", + "display_name": "o3 Pro", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13021,178 +13203,240 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2024-10", + "release_date": "2025-04-16", + "last_updated": "2025-06-10", "cost": { - "input": 0.306, - "output": 0.306 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "auto-model", - "name": "Auto model", - "display_name": "Auto model", + "id": "openai/gpt-5.4-nano", + "name": "GPT 
5.4 Nano", + "display_name": "GPT 5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": false }, - "type": "chat" - }, - { - "id": "ernie-4.5-8k-preview", - "name": "Ernie 4.5 8k Preview", - "display_name": "Ernie 4.5 8k Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8000, - "output": 16384 - }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.66, - "output": 2.6 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "doubao-seed-1-6-250615", - "name": "Doubao Seed 1.6", - "display_name": "Doubao Seed 1.6", + "id": "openai/gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2026-03-03", + "last_updated": "2026-03-06", "cost": { - "input": 0.204, - "output": 0.51 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "step-2-16k-exp", - "name": "Step-2 16k Exp", - "display_name": "Step-2 16k Exp", + "id": "openai/gpt-5.1-thinking", + "name": "GPT 5.1 Thinking", + "display_name": "GPT 5.1 Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "knowledge": "2024-10", + "release_date": "2025-11-12", + "last_updated": "2025-08-07", "cost": { - "input": 7.004, - "output": 19.992 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "step-2-mini", - "name": "Step-2 Mini", - "display_name": "Step-2 Mini", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-05", - "last_updated": "2024-07-05", + "knowledge": "2024-10", + "release_date": "2025-11-12", + "last_updated": "2025-11-13", "cost": { - "input": 0.2006, - "output": 0.408 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview (09/2025)", - "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", @@ -13204,9 +13448,10 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -13216,73 +13461,66 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-10", + "release_date": "2025-11-19", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - 
"output": 0.4 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "ernie-5.1", - "name": "ERNIE 5.1", - "display_name": "ERNIE 5.1", + "id": "openai/text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 119000, - "output": 64000 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-10", - "last_updated": "2026-05-10", - "cost": { - "input": 0.75, - "output": 3, - "cache_read": 0.75 - }, - "type": "chat" + "release_date": "2022-12-15", + "last_updated": "2022-12-15", + "type": "embedding" }, { - "id": "claude-opus-4-thinking:1024", - "name": "Claude 4 Opus Thinking (1K)", - "display_name": "Claude 4 Opus Thinking (1K)", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -13294,64 +13532,69 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 14.994, - "output": 75.004 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-v3-Derestricted", - "name": "Qwen3.5 27B BlueStar v3 Derestricted", - "display_name": "Qwen3.5 27B BlueStar v3 Derestricted", + "id": "openai/gpt-5.3-codex", + "name": "GPT 5.3 Codex", + "display_name": "GPT 5.3 Codex", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13359,28 +13602,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-05", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "yi-medium-200k", - "name": "Yi Medium 200k", - "display_name": "Yi Medium 200k", + "id": "openai/text-embedding-3-small", + "name": "text-embedding-3-small", 
+ "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -13390,27 +13645,24 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03-01", - "cost": { - "input": 2.499, - "output": 2.499 - }, - "type": "chat" + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "type": "embedding" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -13422,9 +13674,10 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -13434,73 +13687,71 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-10", + "release_date": "2025-11-12", + "last_updated": "2025-11-13", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "glm-4-airx", - "name": "GLM-4 AirX", - "display_name": "GLM-4 AirX", + "id": "openai/gpt-image-1.5", + "name": "GPT Image 1.5", + "display_name": "GPT Image 1.5", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8000, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 2.006, - "output": 2.006 + "input": 5, + "output": 32, + "cache_read": 1.25 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "MiniMax-M2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -13510,10 +13761,11 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 131000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13524,91 +13776,79 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-25", - "last_updated": "2025-10-25", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.17, - "output": 1.53 + "input": 0.35, + "output": 0.75, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "step-3", - "name": "Step-3", - "display_name": "Step-3", + "id": 
"openai/gpt-5.4", + "name": "GPT 5.4", + "display_name": "GPT 5.4", "modalities": { "input": [ "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 65536, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", - "cost": { - "input": 0.2499, - "output": 0.6494 - }, - "type": "chat" - }, - { - "id": "qwq-32b", - "name": "Qwen: QwQ 32B", - "display_name": "Qwen: QwQ 32B", - "modalities": { - "input": [ - "text" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.25599999, - "output": 0.30499999 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:32768", - "name": "Claude 4.1 Opus Thinking (32K)", - "display_name": "Claude 4.1 Opus Thinking (32K)", + "id": "openai/gpt-5.4-mini", + "name": "GPT 5.4 Mini", + "display_name": "GPT 5.4 Mini", "modalities": { "input": [ "text", @@ -13620,168 +13860,183 @@ ] }, "limit": { - "context": 200000, - "output": 
32000 + "context": 400000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 14.994, - "output": 75.004 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max 2026-01-23", - "display_name": "Qwen3 Max 2026-01-23", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": 
"medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "knowledge": "2024-10", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 1.2002, - "output": 6.001 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "qwen-3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "openai/gpt-image-1", + "name": "GPT Image 1", + "display_name": "GPT Image 1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 991800, - "output": 65536 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.45, - "output": 2.7 + "input": 5, + "output": 40, + "cache_read": 1.25 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen3.7-max:thinking", - "name": "Qwen3.7 Max Thinking", - "display_name": "Qwen3.7 Max Thinking", + "id": "openai/gpt-image-1-mini", + "name": "GPT Image 1 Mini", + "display_name": "GPT Image 1 Mini", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.25 + "input": 2, + "output": 8, + "cache_read": 0.2 }, - 
"type": "chat" + "type": "imageGeneration" }, { - "id": "gemini-2.5-pro-preview-03-25", - "name": "Gemini 2.5 Pro Preview 0325", - "display_name": "Gemini 2.5 Pro Preview 0325", + "id": "openai/gpt-5.4-pro", + "name": "GPT 5.4 Pro", + "display_name": "GPT 5.4 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -13790,66 +14045,77 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 2.5, - "output": 10 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-vision-pro-250428", - "name": "Doubao 1.5 Thinking Vision Pro", - "display_name": "Doubao 1.5 Thinking Vision Pro", + "id": "openai/gpt-5.5-pro", + "name": "GPT 5.5 Pro", + "display_name": "GPT 5.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": 
true + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-23", "cost": { - "input": 0.55, - "output": 1.43 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "jamba-large-1.6", - "name": "Jamba Large 1.6", - "display_name": "Jamba Large 1.6", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -13859,186 +14125,252 @@ ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.989, - "output": 7.99 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-4.1v-thinking-flash", - "name": "GLM 4.1V Thinking Flash", - "display_name": "GLM 4.1V Thinking Flash", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", 
+ "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "knowledge": "2024-10", + "release_date": "2025-12-18", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 0.3 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gemini-2.5-pro-exp-03-25", - "name": "Gemini 2.5 Pro Experimental 0325", - "display_name": "Gemini 2.5 Pro Experimental 0325", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1 Instant", + "display_name": "GPT-5.1 Instant", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2024-10", + "release_date": "2025-11-12", + "last_updated": "2025-08-07", "cost": { - "input": 2.5, - "output": 10 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "doubao-seed-1-6-thinking-250615", - "name": "Doubao Seed 1.6 Thinking", - "display_name": "Doubao Seed 1.6 Thinking", + "id": "openai/gpt-image-2", + "name": "GPT Image 2", + "display_name": "GPT Image 
2", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.204, - "output": 2.04 + "input": 5, + "output": 30, + "cache_read": 1.25 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gemma-4-31B-Garnet", - "name": "Gemma 4 31B Garnet", - "display_name": "Gemma 4 31B Garnet", + "id": "openai/gpt-5.5", + "name": "GPT 5.5", + "display_name": "GPT 5.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-23", "cost": { - "input": 0.306, - "output": 0.306 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking", - "name": "Claude 4.1 Opus Thinking", - "display_name": "Claude 4.1 Opus Thinking", - "modalities": { + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", + "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" 
] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -14048,41 +14380,44 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 14.994, - "output": 75.004 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-pro-vision-250415", - "name": "Doubao 1.5 Thinking Pro Vision", - "display_name": "Doubao 1.5 Thinking Pro Vision", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -14092,99 +14427,166 @@ "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.15, + "output": 0.6, + 
"cache_read": 0.075 }, "type": "chat" }, { - "id": "owl", - "name": "OWL", - "display_name": "OWL", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 262144 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.1, - "output": 0.3 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "auto-model-premium", - "name": "Auto model (Premium)", - "display_name": "Auto model (Premium)", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + 
"context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Writer-Derestricted", - "name": "Qwen3.5 27B Writer Derestricted", - "display_name": "Qwen3.5 27B Writer Derestricted", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -14192,28 +14594,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude 4 Sonnet", - "display_name": "Claude 4 Sonnet", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ 
"text", @@ -14225,49 +14639,30 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2.992, - "output": 14.994 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-thinking:8192", - "name": "Claude 4 Opus Thinking (8K)", - "display_name": "Claude 4 Opus Thinking (8K)", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", @@ -14280,8 +14675,9 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -14291,95 +14687,79 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta 
header for this model family." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 14.994, - "output": 75.004 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b:thinking", - "name": "Qwen3.5 122B A10B Thinking", - "display_name": "Qwen3.5 122B A10B Thinking", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.36, - "output": 2.88 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "claude-sonnet-4-thinking", - "name": "Claude 4 Sonnet Thinking", - "display_name": "Claude 4 Sonnet Thinking", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -14389,73 +14769,85 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": 
"budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 2.992, - "output": 14.994 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "Gemma-4-31B-Cognitive-Unshackled", - "name": "Gemma 4 31B Cognitive Unshackled", - "display_name": "Gemma 4 31B Cognitive Unshackled", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "deepseek-chat-cheaper", - "name": "DeepSeek V3/Chat Cheaper", - 
"display_name": "DeepSeek V3/Chat Cheaper", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -14464,67 +14856,85 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.25, - "output": 0.7 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.3, - "output": 7.8 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:1024", - "name": 
"Claude 4.1 Opus Thinking (1K)", - "display_name": "Claude 4.1 Opus Thinking (1K)", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -14537,8 +14947,9 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -14548,37 +14959,32 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 14.994, - "output": 75.004 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "glm-z1-airx", - "name": "GLM Z1 AirX", - "display_name": "GLM Z1 AirX", + "id": "zai/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -14588,41 +14994,10 @@ ] }, "limit": { - "context": 32000, - "output": 16384 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.7, - "output": 0.7 - }, - "type": "chat" - }, - { - "id": "claude-opus-4-5-20251101:thinking", - "name": "Claude 4.5 Opus Thinking", - "display_name": "Claude 4.5 Opus Thinking", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - 
"output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 + "context": 131000, + "output": 40000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -14631,74 +15006,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-10", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 4.998, - "output": 25.007 + "input": 2.25, + "output": 2.75, + "cache_read": 2.25 }, "type": "chat" }, { - "id": "brave-research", - "name": "Brave (Research)", - "display_name": "Brave (Research)", + "id": "zai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 66000, + "output": 16000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2023-03-02", - "last_updated": "2024-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 5, - "output": 5 + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - 
"id": "universal-summarizer", - "name": "Universal Summarizer", - "display_name": "Universal Summarizer", + "id": "zai/glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ "text" @@ -14708,27 +15074,37 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 96000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2023-05-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 30, - "output": 30 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "Baichuan4-Air", - "name": "Baichuan 4 Air", - "display_name": "Baichuan 4 Air", + "id": "zai/glm-4.7-flashx", + "name": "GLM 4.7 FlashX", + "display_name": "GLM 4.7 FlashX", "modalities": { "input": [ "text" @@ -14738,86 +15114,91 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2026-01-19", "cost": { - "input": 0.157, - "output": 0.157 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-v2-Derestricted-Lite", - "name": "Qwen3.5 27B BlueStar v2 Derestricted Lite", - "display_name": "Qwen3.5 27B BlueStar v2 
Derestricted Lite", + "id": "zai/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 202800, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "release_date": "2026-04-07", + "last_updated": "2026-03-27", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "Qwen3.5-27B-earica-Derestricted", - "name": "Qwen3.5 27B earica Derestricted", - "display_name": "Qwen3.5 27B earica Derestricted", + "id": "zai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 96000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -14825,85 +15206,76 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "interleaved": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { 
- "id": "Qwen3.5-27B-RpRMax-v1", - "name": "Qwen3.5 27B RpRMax v1", - "display_name": "Qwen3.5 27B RpRMax v1", + "id": "zai/glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 24000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-12-08", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.3, + "output": 0.9, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "holo3-35b-a3b", - "name": "Holo3-35B-A3B", - "display_name": "Holo3-35B-A3B", + "id": "zai/glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 200000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -14911,108 +15283,84 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.25, - "output": 1.8 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "zai/glm-4.6v-flash", + "name": "GLM-4.6V-Flash", + "display_name": "GLM-4.6V-Flash", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], 
"output": [ "text" ] }, "limit": { - "context": 991808, - "output": 65536 + "context": 128000, + "output": 24000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", - "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04 - }, + "knowledge": "2024-10", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "gemini-2.5-flash-preview-05-20:thinking", - "name": "Gemini 2.5 Flash 0520 Thinking", - "display_name": "Gemini 2.5 Flash 0520 Thinking", + "id": "zai/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048000, - "output": 65536 + "context": 128000, + "output": 96000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.15, - "output": 3.5 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "GLM-4.6-Derestricted-v5", - "name": "GLM 4.6 Derestricted v5", - "display_name": "GLM 4.6 Derestricted v5", + "id": "zai/glm-4.7-flash", + "name": "GLM 
4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -15022,41 +15370,48 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-04", + "release_date": "2026-03-13", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 1.5 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-opus-4-thinking", - "name": "Claude 4 Opus Thinking", - "display_name": "Claude 4 Opus Thinking", + "id": "zai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 202800, + "output": 131100 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -15065,38 +15420,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-15", - "last_updated": "2025-07-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-11", "cost": { - "input": 14.994, - "output": 75.004 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-math-v2", - "name": "DeepSeek Math V2", - "display_name": "DeepSeek Math V2", + "id": "zai/glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ "text" @@ -15106,637 +15452,471 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 202800, + "output": 131100 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "release_date": "2026-03-15", + "last_updated": "2026-03-16", "cost": { - "input": 0.6, - "output": 2.2 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "qwen25-vl-72b-instruct", - "name": "Qwen25 VL 72b", - "display_name": "Qwen25 VL 72b", + "id": "bytedance/seedream-5.0-lite", + "name": "Seedream 5.0 Lite", + "display_name": "Seedream 5.0 Lite", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", - "cost": { - "input": 0.69989, - "output": 0.69989 - }, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "Qwen3.5-27B-Omega-Evolution-v2.0-Derestricted", - 
"name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted", - "display_name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted", + "id": "bytedance/seedance-2.0-fast", + "name": "Seedance 2.0 Fast", + "display_name": "Seedance 2.0 Fast", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", "type": "chat" }, { - "id": "ernie-x1.1-preview", - "name": "ERNIE X1.1", - "display_name": "ERNIE X1.1", + "id": "bytedance/seedance-v1.0-pro", + "name": "Seedance v1.0 Pro", + "display_name": "Seedance v1.0 Pro", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 64000, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", - "cost": { - "input": 0.15, - "output": 0.6 - }, + "release_date": "2025-06-11", + "last_updated": "2025-06-11", "type": "chat" }, { - "id": "Qwen3.5-27B-Writer-Derestricted-Lite", - "name": "Qwen3.5 27B Writer Derestricted Lite", - "display_name": "Qwen3.5 27B Writer Derestricted Lite", + "id": "bytedance/seed-1.6", + "name": "Seed 1.6", + 
"display_name": "Seed 1.6", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "knowledge": "2024-10", + "release_date": "2025-09-01", + "last_updated": "2025-09", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "claude-opus-4-1-thinking:8192", - "name": "Claude 4.1 Opus Thinking (8K)", - "display_name": "Claude 4.1 Opus Thinking (8K)", + "id": "bytedance/seedance-2.0", + "name": "Seedance 2.0", + "display_name": "Seedance 2.0", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 14.994, - "output": 75.004 - }, + "release_date": "2026-04-14", + "last_updated": "2026-04-14", "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929-thinking", - "name": "Claude Sonnet 4.5 Thinking", - "display_name": "Claude Sonnet 4.5 Thinking", + "id": "bytedance/seedance-v1.5-pro", + "name": "Seedance v1.5 Pro", + "display_name": "Seedance v1.5 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 2.992, - "output": 14.994 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "bytedance/seedance-v1.0-lite-t2v", + "name": "Seedance v1.0 Lite Text-to-Video", + "display_name": "Seedance v1.0 Lite Text-to-Video", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", - "cost": { - "input": 0.27, - "output": 2.16 - }, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "type": "chat" }, { - "id": "glm-4-plus-0111", - "name": "GLM 4 Plus 0111", - "display_name": "GLM 4 Plus 0111", + "id": "bytedance/seedance-v1.0-pro-fast", + "name": "Seedance v1.0 Pro Fast", + "display_name": "Seedance v1.0 Pro Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", - "cost": { - "input": 9.996, - "output": 9.996 - }, + "release_date": "2025-10-31", + "last_updated": "2025-10-31", "type": "chat" }, { - "id": 
"ernie-x1-turbo-32k", - "name": "Ernie X1 Turbo 32k", - "display_name": "Ernie X1 Turbo 32k", + "id": "bytedance/seedream-4.0", + "name": "Seedream 4.0", + "display_name": "Seedream 4.0", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-08", - "last_updated": "2025-05-08", - "cost": { - "input": 0.165, - "output": 0.66 - }, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "type": "chat" }, { - "id": "gemma-4-31B-Fabled", - "name": "Gemma 4 31B Fabled", - "display_name": "Gemma 4 31B Fabled", + "id": "bytedance/seedream-4.5", + "name": "Seedream 4.5", + "display_name": "Seedream 4.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", - "cost": { - "input": 0.306, - "output": 0.306 - }, + "release_date": "2025-11-28", + "last_updated": "2025-11-28", "type": "chat" }, { - "id": "claude-sonnet-4-thinking:32768", - "name": "Claude 4 Sonnet Thinking (32K)", - "display_name": "Claude 4 Sonnet Thinking (32K)", + "id": "bytedance/seed-1.8", + "name": "Seed 1.8", + "display_name": "Seed 1.8", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-10", + "release_date": "2025-09-01", + "last_updated": "2025-10", "cost": { - "input": 2.992, - "output": 14.994 + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long 10M", - "display_name": "Qwen Long 10M", + "id": "bytedance/seedance-v1.0-lite-i2v", + "name": "Seedance v1.0 Lite Image-to-Video", + "display_name": "Seedance v1.0 Lite Image-to-Video", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 10000000, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", - "cost": { - "input": 0.1003, - "output": 0.408 - }, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "type": "chat" }, { - "id": "qwen3.5-35b-a3b:thinking", - "name": "Qwen3.5 35B A3B Thinking", - "display_name": "Qwen3.5 35B A3B Thinking", + "id": "morph/morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 32000, + "output": 32000 }, + "temperature": 
false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.225, - "output": 1.8 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "qvq-max", - "name": "Qwen: QvQ Max", - "display_name": "Qwen: QvQ Max", + "id": "morph/morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16000, + "output": 16000 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-28", - "last_updated": "2025-03-28", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 1.4, - "output": 5.3 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "Gemini 3 Pro Image", - "display_name": "Gemini 3 Pro Image", + "id": "nvidia/nemotron-3-ultra-550b-a55b", + "name": "Nemotron 3 Ultra", + "display_name": "Nemotron 3 Ultra", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 65000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - 
], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-06-04", + "last_updated": "2026-06-04", "cost": { - "input": 2, - "output": 12 + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "doubao-seed-2-0-pro-260215", - "name": "Doubao Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -15746,27 +15926,63 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-12-15", "cost": { - "input": 0.782, - "output": 3.876 + "input": 0.05, + "output": 0.24 }, "type": "chat" }, { - "id": "jamba-mini", - "name": "Jamba Mini", - "display_name": "Jamba Mini", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B V2", + "display_name": "Nvidia Nemotron Nano 9B V2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", + "cost": { + "input": 0.06, + "output": 0.23 + }, + "type": "chat" + }, + { + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA Nemotron 3 
Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -15777,26 +15993,27 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-03-18", + "last_updated": "2026-03-11", "cost": { - "input": 0.1989, - "output": 0.408 + "input": 0.15, + "output": 0.65 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "nvidia/nemotron-nano-12b-v2-vl", + "name": "Nvidia Nemotron Nano 12B V2 VL", + "display_name": "Nvidia Nemotron Nano 12B V2 VL", "modalities": { "input": [ "text", @@ -15807,72 +16024,66 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-10-28", "cost": { - "input": 0.5, - "output": 6 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3.5-27b:thinking", - "name": "Qwen3.5 27B Thinking", - "display_name": "Qwen3.5 27B Thinking", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo M2.5", + "display_name": "MiMo M2.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 1050000, + "output": 131100 }, - "tool_call": false, + "temperature": 
true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.27, - "output": 2.16 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -15882,9 +16093,10 @@ ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 262144, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -15892,63 +16104,90 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2024-10", + "release_date": "2025-12-17", + "last_updated": "2026-02-04", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "Qwen3.5-27B-BlueStar-Derestricted-Lite", - "name": "Qwen3.5 27B BlueStar Derestricted Lite", - "display_name": "Qwen3.5 27B BlueStar Derestricted Lite", + "id": "xiaomi/mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", 
"modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1050000, + "output": 131000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-06", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.435, + "output": 0.87, + "cache_read": 0.0036 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Deep Research", - "display_name": "Perplexity Deep Research", + "id": "inception/mercury-coder-small", + "name": "Mercury Coder Small Beta", + "display_name": "Mercury Coder Small Beta", "modalities": { "input": [ "text" @@ -15958,27 +16197,28 @@ ] }, "limit": { - "context": 60000, - "output": 128000 + "context": 32000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-25", - "last_updated": "2025-02-25", + "release_date": "2025-02-26", + "last_updated": "2025-02-26", "cost": { - "input": 3.4, - "output": 13.6 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "glm-4-flash", - "name": "GLM-4 Flash", - "display_name": "GLM-4 Flash", + "id": "inception/mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" @@ -15989,157 +16229,228 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "release_date": "2026-02-24", + "last_updated": "2026-03-06", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0.25, + "output": 0.75, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Omega-Evolution-v2.2-Derestricted", - "name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted", - "display_name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.306, - "output": 0.306 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "doubao-seed-2-0-mini-260215", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 2.0 Mini", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.0493, - "output": 0.4845 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen3.5-27B-Marvin-V2-Derestricted", - "name": "Qwen3.5 27B Marvin V2 Derestricted", - "display_name": "Qwen3.5 27B Marvin V2 Derestricted", + "id": "anthropic/claude-opus-4.8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.306, - "output": 0.306 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "anthropic/claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 995904, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -16147,321 +16458,562 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.3995, - "output": 1.2002 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "KAT Coder Pro V2", - "display_name": "KAT Coder Pro V2", + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 80000 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-28", - "last_updated": "2026-03-28", + "knowledge": "2025-03-31", + "release_date": "2024-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.3, - "output": 1.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "z-ai/glm-4.6:thinking", - "name": "GLM 4.6 Thinking", - "display_name": "GLM 4.6 Thinking", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.4, - "output": 1.5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.4, - "output": 1.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "z-ai/glm-5v-turbo:thinking", - "name": "GLM 5V Turbo Thinking", - "display_name": "GLM 5V Turbo Thinking", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 200000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-22", - "last_updated": "2025-11-22", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "z-ai/glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "z-ai/glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "z-ai/glm-4.5v:thinking", - "name": "GLM 4.5V Thinking", - "display_name": "GLM 4.5V Thinking", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 96000 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-22", - "last_updated": "2025-11-22", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.6, - "output": 1.7999999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "upstage/solar-pro-3", - "name": "Solar Pro 3", - "display_name": "Solar Pro 3", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", - "name": "Tongyi DeepResearch 30B A3B", - "display_name": "Tongyi DeepResearch 30B A3B", + "id": "cohere/rerank-v3.5", + "name": "Cohere Rerank 3.5", + "display_name": "Cohere Rerank 3.5", "modalities": { "input": [ "text" @@ -16471,27 +17023,24 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 4096, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "cost": { - "input": 0.08, - "output": 0.24000000000000002 - }, + "release_date": "2024-12-02", + "last_updated": "2024-12-02", "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - 
"name": "GLM Z1 32B 0414", - "display_name": "GLM Z1 32B 0414", + "id": "cohere/command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" @@ -16501,27 +17050,29 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 256000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2024-10", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "GLM Z1 9B 0414", - "display_name": "GLM Z1 9B 0414", + "id": "cohere/rerank-v4-fast", + "name": "Cohere Rerank 4 Fast", + "display_name": "Cohere Rerank 4 Fast", "modalities": { "input": [ "text" @@ -16532,26 +17083,23 @@ }, "limit": { "context": 32000, - "output": 8000 + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.2, - "output": 0.2 - }, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "GLM 4 32B 0414", - "display_name": "GLM 4 32B 0414", + "id": "cohere/embed-v4.0", + "name": "Embed v4.0", + "display_name": "Embed v4.0", "modalities": { "input": [ "text" @@ -16562,26 +17110,23 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.2, - "output": 0.2 - }, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "type": "chat" }, { - "id": 
"THUDM/GLM-4-9B-0414", - "name": "GLM 4 9B 0414", - "display_name": "GLM 4 9B 0414", + "id": "cohere/rerank-v4-pro", + "name": "Cohere Rerank 4 Pro", + "display_name": "Cohere Rerank 4 Pro", "modalities": { "input": [ "text" @@ -16592,57 +17137,58 @@ }, "limit": { "context": 32000, - "output": 8000 + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.2, - "output": 0.2 - }, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "TheDrummer/Skyfall-31B-v4.2", - "name": "TheDrummer Skyfall 31B v4.2", - "display_name": "TheDrummer Skyfall 31B v4.2", + "id": "stepfun/step-3.7-flash", + "name": "Step 3.7 Flash", + "display_name": "Step 3.7 Flash", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-26", - "last_updated": "2026-03-26", + "knowledge": "2026-01-01", + "release_date": "2026-05-28", + "last_updated": "2026-05-29", "cost": { - "input": 0.55, - "output": 0.8 + "input": 0.2, + "output": 1.15, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "TheDrummer/Rocinante-12B-v1.1", - "name": "Rocinante 12b", - "display_name": "Rocinante 12b", + "id": "stepfun/step-3.5-flash", + "name": "StepFun 3.5 Flash", + "display_name": "StepFun 3.5 Flash", "modalities": { "input": [ "text" @@ -16652,27 +17198,31 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262114, + "output": 262114 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.408, - "output": 0.595 + "input": 0.09, + "output": 0.3, + "cache_write": 0.02 }, "type": "chat" }, { - "id": "TheDrummer/Cydonia-24B-v4", - "name": "The Drummer Cydonia 24B v4", - "display_name": "The Drummer Cydonia 24B v4", + "id": "interfaze/interfaze-beta", + "name": "Interfaze Beta", + "display_name": "Interfaze Beta", "modalities": { "input": [ "text" @@ -16682,602 +17232,547 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 1000000, + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2025-10-07", + "last_updated": "2026-04-29", "cost": { - "input": 0.2006, - "output": 0.2414 + "input": 1.5, + "output": 3.5 }, "type": "chat" }, { - "id": "TheDrummer/Magidonia-24B-v4.3", - "name": "The Drummer Magidonia 24B v4.3", - "display_name": "The Drummer Magidonia 24B v4.3", + "id": "bfl/flux-kontext-max", + "name": "FLUX.1 Kontext Max", + "display_name": "FLUX.1 Kontext Max", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-25", - "last_updated": "2025-12-25", - "cost": { - "input": 0.1003, - "output": 0.1207 - }, + "release_date": "2025-06-01", + "last_updated": "2025-06", "type": "chat" }, { - "id": "TheDrummer/Cydonia-24B-v4.3", - "name": "The Drummer Cydonia 24B v4.3", - "display_name": "The Drummer Cydonia 24B v4.3", + "id": 
"bfl/flux-2-flex", + "name": "FLUX.2 [flex]", + "display_name": "FLUX.2 [flex]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-25", - "last_updated": "2025-12-25", - "cost": { - "input": 0.1003, - "output": 0.1207 - }, - "type": "chat" + "release_date": "2026-06-08", + "last_updated": "2026-06-08", + "type": "imageGeneration" }, { - "id": "TheDrummer/Anubis-70B-v1.1", - "name": "Anubis 70B v1.1", - "display_name": "Anubis 70B v1.1", + "id": "bfl/flux-pro-1.1-ultra", + "name": "FLUX1.1 [pro] Ultra", + "display_name": "FLUX1.1 [pro] Ultra", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", - "cost": { - "input": 0.31, - "output": 0.31 - }, + "release_date": "2024-11-01", + "last_updated": "2024-11", "type": "chat" }, { - "id": "TheDrummer/Anubis-70B-v1", - "name": "Anubis 70B v1", - "display_name": "Anubis 70B v1", + "id": "bfl/flux-2-max", + "name": "FLUX.2 [max]", + "display_name": "FLUX.2 [max]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 67300, + "output": 67300 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", - "cost": { - "input": 0.31, - "output": 0.31 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "TheDrummer/skyfall-36b-v2", 
- "name": "TheDrummer Skyfall 36B V2", - "display_name": "TheDrummer Skyfall 36B V2", + "id": "bfl/flux-pro-1.1", + "name": "FLUX1.1 [pro]", + "display_name": "FLUX1.1 [pro]", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 64000, - "output": 32768 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", - "cost": { - "input": 0.493, - "output": 0.493 - }, + "release_date": "2024-10-01", + "last_updated": "2024-10", "type": "chat" }, { - "id": "TheDrummer/Cydonia-24B-v4.1", - "name": "The Drummer Cydonia 24B v4.1", - "display_name": "The Drummer Cydonia 24B v4.1", + "id": "bfl/flux-pro-1.0-fill", + "name": "FLUX.1 Fill [pro]", + "display_name": "FLUX.1 Fill [pro]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", - "cost": { - "input": 0.1003, - "output": 0.1207 - }, + "release_date": "2024-10-01", + "last_updated": "2024-10", "type": "chat" }, { - "id": "TheDrummer/Cydonia-24B-v2", - "name": "The Drummer Cydonia 24B v2", - "display_name": "The Drummer Cydonia 24B v2", + "id": "bfl/flux-2-klein-4b", + "name": "FLUX.2 [klein] 4B", + "display_name": "FLUX.2 [klein] 4B", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", - 
"cost": { - "input": 0.1003, - "output": 0.1207 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "TheDrummer/UnslopNemo-12B-v4.1", - "name": "UnslopNemo 12b v4", - "display_name": "UnslopNemo 12b v4", + "id": "bfl/flux-2-klein-9b", + "name": "FLUX.2 [klein] 9B", + "display_name": "FLUX.2 [klein] 9B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32768, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", - "cost": { - "input": 0.493, - "output": 0.493 - }, + "release_date": "2026-06-08", + "last_updated": "2026-06-08", "type": "chat" }, { - "id": "mistralai/ministral-14b-instruct-2512", - "name": "Ministral 3 14B", - "display_name": "Ministral 3 14B", + "id": "bfl/flux-kontext-pro", + "name": "FLUX.1 Kontext Pro", + "display_name": "FLUX.1 Kontext Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0.1, - "output": 0.4 - }, + "release_date": "2025-06-01", + "last_updated": "2025-06", "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "bfl/flux-2-pro", + "name": "FLUX.2 [pro]", + "display_name": "FLUX.2 [pro]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 67300, + "output": 67300 }, + "temperature": true, 
"tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" + "release_date": "2026-06-08", + "last_updated": "2026-06-08", + "type": "imageGeneration" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "recraft/recraft-v4.1-pro", + "name": "Recraft V4.1 Pro", + "display_name": "Recraft V4.1 Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", - "cost": { - "input": 0.2, - "output": 0.2 - }, + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "type": "chat" }, { - "id": "mistralai/ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "recraft/recraft-v4.1", + "name": "Recraft V4.1", + "display_name": "Recraft V4.1", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", - "cost": { - "input": 0.15, - "output": 0.15 - }, + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B", - "display_name": "Mistral Large 3 675B", + "id": "recraft/recraft-v4", + "name": "Recraft V4", + "display_name": "Recraft V4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" 
] }, "limit": { - "context": 262144, - "output": 256000 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 1, - "output": 3 - }, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct-v0.1", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "recraft/recraft-v4-pro", + "name": "Recraft V4 Pro", + "display_name": "Recraft V4 Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 0.8999999999999999, - "output": 0.8999999999999999 - }, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "recraft/recraft-v2", + "name": "Recraft V2", + "display_name": "Recraft V2", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 256000 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-02-26", - "last_updated": "2024-02-26", - "cost": { - "input": 2.006, - "output": 6.001 - }, + "release_date": "2024-03-01", + "last_updated": "2024-03", "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "recraft/recraft-v3", + "name": "Recraft V3", + 
"display_name": "Recraft V3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 512, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", - "cost": { - "input": 0.1, - "output": 0.1 - }, + "release_date": "2024-10-01", + "last_updated": "2024-10", "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "recraft/recraft-v4.1-utility-pro", + "name": "Recraft V4.1 Utility Pro", + "display_name": "Recraft V4.1 Utility Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 16384, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.1003, - "output": 0.1207 - }, + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral Saba", - "display_name": "Mistral Saba", + "id": "recraft/recraft-v4.1-utility", + "name": "Recraft V4.1 Utility", + "display_name": "Recraft V4.1 Utility", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32000, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-17", - "last_updated": "2025-02-17", - "cost": { - "input": 0.1989, - "output": 0.595 - }, + "release_date": "2026-05-14", + "last_updated": "2026-05-14", "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral Medium 3", - "display_name": 
"Mistral Medium 3", + "id": "arcee-ai/trinity-large-preview", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 131000, + "output": 131000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2024-10", + "release_date": "2025-01-01", + "last_updated": "2025-01", "cost": { - "input": 0.4, - "output": 2 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct-v0.1", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "arcee-ai/trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -17287,59 +17782,61 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262100, + "output": 80000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-03", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.25, + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "mistralai/mistral-small-4-119b-2603:thinking", - "name": "Mistral Small 4 119B Thinking", - "display_name": "Mistral Small 4 119B Thinking", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 131072 }, - 
"tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2025-12", "cost": { - "input": 0.4, - "output": 1.4 + "input": 0.045, + "output": 0.15 }, "type": "chat" }, { - "id": "mistralai/Devstral-Small-2505", - "name": "Mistral Devstral Small 2505", - "display_name": "Mistral Devstral Small 2505", + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ "text" @@ -17349,57 +17846,55 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 127000, + "output": 8000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", - "cost": { - "input": 0.060000000000000005, - "output": 0.060000000000000005 - }, + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 127000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", - "cost": { - "input": 0.3, - "output": 0.8999999999999999 - }, + "knowledge": "2025-02", + "release_date": "2025-02-19", + 
"last_updated": "2025-02-19", "type": "chat" }, { - "id": "mistralai/mistral-small-4-119b-2603", - "name": "Mistral Small 4 119B", - "display_name": "Mistral Small 4 119B", + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", @@ -17410,28 +17905,25 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 8000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", - "cost": { - "input": 0.4, - "output": 1.4 - }, + "knowledge": "2025-09", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "type": "chat" }, { - "id": "mistralai/devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "amazon/titan-embed-text-v2", + "name": "Titan Text Embeddings V2", + "display_name": "Titan Text Embeddings V2", "modalities": { "input": [ "text" @@ -17441,253 +17933,268 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 1536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "cost": { - "input": 0.4, - "output": 1.4 - }, + "release_date": "2024-04-01", + "last_updated": "2024-04", "type": "chat" }, { - "id": "deepseek/deepseek-v3.2:thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "amazon/nova-2-lite", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 1000000, + "output": 1000000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": 
true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro-cheaper", - "name": "DeepSeek V4 Pro Cheaper", - "display_name": "DeepSeek V4 Pro Cheaper", + "id": "amazon/nova-lite", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 300000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "amazon/nova-micro", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": 
"2024-12-03", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "DeepSeek Prover v2 671B", - "display_name": "DeepSeek Prover v2 671B", + "id": "amazon/nova-pro", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 16384 + "context": 300000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 1, - "output": 2.5 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash:thinking", - "name": "DeepSeek V4 Flash (Thinking)", - "display_name": "DeepSeek V4 Flash (Thinking)", + "id": "alibaba/qwen3-vl-thinking", + "name": "Qwen3 VL Thinking", + "display_name": "Qwen3 VL Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.14, - 
"output": 0.28, - "cache_read": 0.028 + "input": 0.4, + "output": 4 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek V3.2 Speciale", - "display_name": "DeepSeek V3.2 Speciale", + "id": "alibaba/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163000, + "context": 1000000, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 1, + "output": 5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro:thinking", - "name": "DeepSeek V4 Pro (Thinking)", - "display_name": "DeepSeek V4 Pro (Thinking)", + "id": "alibaba/wan-v2.6-r2v", + "name": "Wan v2.6 Reference-to-Video", + "display_name": "Wan v2.6 Reference-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 1.1, - "output": 2.2, - "cache_read": 0.11 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro-cheaper:thinking", - "name": "DeepSeek V4 Pro Cheaper (Thinking)", - "display_name": "DeepSeek V4 Pro Cheaper (Thinking)", + 
"id": "alibaba/qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -17697,29 +18204,24 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", - "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 - }, - "type": "chat" + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "type": "embedding" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "alibaba/qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -17729,13 +18231,13 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 262144, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -17750,19 +18252,20 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "alibaba/qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ "text" @@ -17772,40 +18275,24 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 32768, + "output": 32768 }, - "tool_call": 
true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 1.1, - "output": 2.2, - "cache_read": 0.11 - }, - "type": "chat" + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "type": "embedding" }, { - "id": "deepseek/deepseek-latest", - "name": "DeepSeek Latest", - "display_name": "DeepSeek Latest", + "id": "alibaba/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -17815,149 +18302,172 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-12", + "last_updated": "2025-09", "cost": { - "input": 1.1, - "output": 2.2, - "cache_read": 0.11 + "input": 0.15, + "output": 1.2 }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "QwenLong L1 32B", - "display_name": "QwenLong L1 32B", + "id": "alibaba/qwen3.7-plus", + "name": "Qwen 3.7 Plus", + "display_name": "Qwen 3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 40960 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "knowledge": "2025-04", + "release_date": "2026-06-01", + "last_updated": "2026-06-02", "cost": { - "input": 0.13999999999999999, - "output": 0.6 + "input": 0.4, + "output": 1.6, + "cache_read": 0.08, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24b Instruct", - "display_name": "Mistral Small 3.2 24b Instruct", + "id": "alibaba/qwen3-vl-instruct", + "name": "Qwen3 VL Instruct", + "display_name": "Qwen3 VL Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 131072, + "output": 129024 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.2, - "output": 0.4 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMax M1 80K", - "display_name": "MiniMax M1 80K", + "id": "alibaba/qwen3.7-max", + "name": "Qwen 3.7 Max", + "display_name": "Qwen 3.7 Max", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 991000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - 
"release_date": "2025-06-16", - "last_updated": "2025-06-16", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.6052, - "output": 2.4225000000000003 + "input": 1.25, + "output": 3.75, + "cache_read": 0.25, + "cache_write": 1.5625 }, "type": "chat" }, { - "id": "dmind/dmind-1-mini", - "name": "DMind-1-Mini", - "display_name": "DMind-1-Mini", + "id": "alibaba/wan-v2.5-t2v-preview", + "name": "Wan v2.5 Text-to-Video Preview", + "display_name": "Wan v2.5 Text-to-Video Preview", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 32768, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", - "cost": { - "input": 0.2, - "output": 0.4 - }, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "type": "chat" }, { - "id": "dmind/dmind-1", - "name": "DMind-1", - "display_name": "DMind-1", + "id": "alibaba/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -17967,27 +18477,41 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.3, - "output": 0.6 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "zai-org/glm-5.1:thinking", - "name": "GLM 5.1 Thinking", - 
"display_name": "GLM 5.1 Thinking", + "id": "alibaba/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -17997,28 +18521,41 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "knowledge": "2025-09", + "release_date": "2025-09-12", + "last_updated": "2025-09", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.15, + "output": 1.2 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6-turbo:thinking", - "name": "GLM 4.6 Turbo (Thinking)", - "display_name": "GLM 4.6 Turbo (Thinking)", + "id": "alibaba/qwen3-embedding-4b", + "name": "Qwen3 Embedding 4B", + "display_name": "Qwen3 Embedding 4B", "modalities": { "input": [ "text" @@ -18028,28 +18565,71 @@ ] }, "limit": { - "context": 200000, - "output": 204800 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "type": "embedding" + }, + { + "id": "alibaba/qwen3.5-flash", + "name": "Qwen 3.5 Flash", + "display_name": "Qwen 3.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 1, - "output": 3 + "input": 0.1, + "output": 0.4, + "cache_read": 0.001, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-original", - "name": "GLM 4.7 Original", - "display_name": "GLM 4.7 Original", + "id": "alibaba/qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -18059,29 +18639,30 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 1.5, + "output": 7.5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "alibaba/qwen-3-235b", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -18091,91 +18672,104 @@ ] }, "limit": { - "context": 128000, - "output": 98304 + "context": 262144, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 0.12, - "output": 0.8 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, 
{ - "id": "zai-org/glm-4.6v-flash-original", - "name": "GLM 4.6V Flash", - "display_name": "GLM 4.6V Flash", + "id": "alibaba/qwen3.5-plus", + "name": "Qwen 3.5 Plus", + "display_name": "Qwen 3.5 Plus", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "zai-org/glm-latest", - "name": "GLM Latest", - "display_name": "GLM Latest", + "id": "alibaba/wan-v2.6-t2v", + "name": "Wan v2.6 Text-to-Video", + "display_name": "Wan v2.6 Text-to-Video", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", - "cost": { - "input": 0.75, - "output": 2.6, - "cache_read": 0.15 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "alibaba/qwen3-max-thinking", + "name": "Qwen 3 Max Thinking", + "display_name": "Qwen 3 
Max Thinking", "modalities": { "input": [ "text" @@ -18185,9 +18779,10 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 256000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -18206,81 +18801,74 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "knowledge": "2025-01", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.15, - "output": 0.8 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash-original:thinking", - "name": "GLM 4.7 Flash Original Thinking", - "display_name": "GLM 4.7 Flash Original Thinking", + "id": "alibaba/wan-v2.6-i2v-flash", + "name": "Wan v2.6 Image-to-Video Flash", + "display_name": "Wan v2.6 Image-to-Video Flash", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", - "cost": { - "input": 0.07, - "output": 0.4 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "zai-org/glm-5-original:thinking", - "name": "GLM 5 Original Thinking", - "display_name": "GLM 5 Original Thinking", + "id": "alibaba/wan-v2.6-r2v-flash", + "name": "Wan v2.6 Reference-to-Video Flash", + "display_name": "Wan v2.6 Reference-to-Video Flash", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, 
"open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "zai-org/glm-4.6-original", - "name": "GLM 4.6 Original", - "display_name": "GLM 4.6 Original", + "id": "alibaba/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -18291,90 +18879,100 @@ }, "limit": { "context": 256000, - "output": 65535 + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-07-22", + "last_updated": "2026-02-19", "cost": { - "input": 0.35, - "output": 1.4 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "zai-org/glm-5-original", - "name": "GLM 5 Original", - "display_name": "GLM 5 Original", + "id": "alibaba/qwen3.6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "zai-org/glm-4.6v", - "name": "GLM 4.6V", - 
"display_name": "GLM 4.6V", + "id": "alibaba/wan-v2.6-i2v", + "name": "Wan v2.6 Image-to-Video", + "display_name": "Wan v2.6 Image-to-Video", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 0.3, - "output": 0.9 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "zai-org/GLM-4.6-turbo", - "name": "GLM 4.6 Turbo", - "display_name": "GLM 4.6 Turbo", + "id": "alibaba/qwen-3-30b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -18384,58 +18982,109 @@ ] }, "limit": { - "context": 200000, - "output": 204800 + "context": 40960, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 1, - "output": 3 + "input": 0.12, + "output": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5:thinking", - "name": "GLM 4.5 (Thinking)", - "display_name": "GLM 4.5 (Thinking)", + "id": "alibaba/qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-04", "cost": { - "input": 0.3, - "output": 1.3 + "input": 0.4, + "output": 4 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "alibaba/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 129024 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-24", + "last_updated": "2026-05-01", + "cost": { + "input": 0.4, + "output": 1.6 + }, + "type": "chat" + }, + { + "id": "alibaba/qwen-3-14b", + "name": "Qwen3-14B", + "display_name": "Qwen3-14B", "modalities": { "input": [ "text" @@ -18445,33 +19094,30 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 40960, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.12, + "output": 0.24 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash-original", - "name": "GLM 4.7 Flash Original", - "display_name": "GLM 4.7 
Flash Original", + "id": "alibaba/qwen-3-32b", + "name": "Qwen 3.32B", + "display_name": "Qwen 3.32B", "modalities": { "input": [ "text" @@ -18481,9 +19127,10 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -18491,49 +19138,54 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "zai-org/glm-5:thinking", - "name": "GLM 5 Thinking", - "display_name": "GLM 5 Thinking", + "id": "alibaba/qwen-3.6-max-preview", + "name": "Qwen 3.6 Max Preview", + "display_name": "Qwen 3.6 Max Preview", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 240000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-04-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 2.55 + "input": 1.3, + "output": 7.8, + "cache_read": 0.26, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-original:thinking", - "name": "GLM 4.7 Original Thinking", - "display_name": "GLM 4.7 Original Thinking", + "id": "alibaba/qwen3-coder-30b-a3b", + "name": "Qwen 3 Coder 30B A3B Instruct", + "display_name": "Qwen 3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -18543,9 +19195,10 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 262144, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -18553,31 +19206,34 
@@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2025-04", + "release_date": "2025-04-01", + "last_updated": "2025-04", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "alibaba/qwen3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -18594,20 +19250,23 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.5, + "output": 3, + "cache_read": 0.1, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "zai-org/glm-4.7:thinking", - "name": "GLM 4.7 Thinking", - "display_name": "GLM 4.7 Thinking", + "id": "meituan/longcat-flash-thinking-2601", + "name": "LongCat Flash Thinking 2601", + "display_name": "LongCat Flash Thinking 2601", "modalities": { "input": [ "text" @@ -18617,28 +19276,25 @@ ] }, "limit": { - "context": 200000, - "output": 65535 + "context": 32768, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 
4.5", + "id": "meituan/longcat-flash-chat", + "name": "LongCat Flash Chat", + "display_name": "LongCat Flash Chat", "modalities": { "input": [ "text" @@ -18649,26 +19305,24 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.3, - "output": 1.3 - }, + "knowledge": "2024-10", + "release_date": "2025-08-30", + "last_updated": "2025-08-30", "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air:thinking", - "name": "GLM 4.5 Air (Thinking)", - "display_name": "GLM 4.5 Air (Thinking)", + "id": "meta/llama-3.2-1b", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ "text" @@ -18679,27 +19333,28 @@ }, "limit": { "context": 128000, - "output": 98304 + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.12, - "output": 0.8 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "zai-org/glm-4.6v-original", - "name": "GLM 4.6V Original", - "display_name": "GLM 4.6V Original", + "id": "meta/llama-3.2-11b", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", @@ -18711,26 +19366,28 @@ }, "limit": { "context": 128000, - "output": 24000 + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + 
"knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.6, - "output": 0.9 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash:thinking", - "name": "GLM 4.7 Flash Thinking", - "display_name": "GLM 4.7 Flash Thinking", + "id": "meta/llama-3.1-8b", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -18740,64 +19397,62 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "meta/llama-3.2-90b", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.3, - "output": 2.55 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", - "name": 
"NemoMix 12B Unleashed", - "display_name": "NemoMix 12B Unleashed", + "id": "meta/llama-3.1-70b", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ "text" @@ -18807,27 +19462,29 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "deepcogito/cogito-v1-preview-qwen-32B", - "name": "Cogito v1 Preview Qwen 32B", - "display_name": "Cogito v1 Preview Qwen 32B", + "id": "meta/llama-3.2-3b", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -18838,56 +19495,61 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 1.7999999999999998, - "output": 1.7999999999999998 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "inflection/inflection-3-pi", - "name": "Inflection 3 Pi", - "display_name": "Inflection 3 Pi", + "id": "meta/llama-4-scout", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, + "context": 128000, "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { 
"supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection 3 Productivity", - "display_name": "Inflection 3 Productivity", + "id": "meta/llama-3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -18897,154 +19559,179 @@ ] }, "limit": { - "context": 8000, + "context": 128000, "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", - "name": "Llama 3.3 70B Wayfarer", - "display_name": "Llama 3.3 70B Wayfarer", + "id": "meta/llama-4-maverick", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", 
"cost": { - "input": 0.700000007, - "output": 0.700000007 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "perceptron/perceptron-mk1", - "name": "Perceptron Mk1", - "display_name": "Perceptron Mk1", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1000000, + "output": 384000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7:thinking", - "name": "Claude 4.7 Opus Thinking", - "display_name": "Claude 4.7 Opus Thinking", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - 
"continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "cost": { + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, - "attachment": true, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v3", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 163840 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking", - "name": "Claude 4.6 Opus Thinking", - "display_name": "Claude 4.6 Opus Thinking", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -19053,8 +19740,9 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 384000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -19063,45 +19751,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": 
[ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-23", + "last_updated": "2026-04-24", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.435, + "output": 0.87, + "cache_read": 0.0036 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "deepseek/deepseek-v3.2-thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ "text", @@ -19113,91 +19786,70 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 8000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "interleaved": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 0.62, + "output": 1.85 }, "type": "chat" }, { - "id": "anthropic/claude-opus-latest", - "name": "Claude Opus Latest", - "display_name": "Claude Opus Latest", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 163840, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 0.56, + "output": 1.68, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude 4.7 Opus", - "display_name": "Claude 4.7 Opus", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", @@ -19209,69 +19861,48 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 8000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - 
"summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 0.28, + "output": 0.42, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.8:thinking", - "name": "Claude Opus 4.8 Thinking", - "display_name": "Claude Opus 4.8 Thinking", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -19280,92 +19911,87 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-latest", - "name": "Claude Haiku Latest", - "display_name": "Claude Haiku Latest", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax M2.7 High Speed", + "display_name": "MiniMax M2.7 High Speed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131100 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:max", - "name": "Claude 4.6 Opus Thinking Max", - "display_name": "Claude 4.6 Opus Thinking Max", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -19373,107 +19999,66 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude 4.6 Opus", - "display_name": "Claude 4.6 Opus", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be 
chosen per workload." - ] + "interleaved": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-12-23", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "minimax/minimax-m3", + "name": "MiniMax M3", + "display_name": "MiniMax M3", "modalities": { "input": [ "text", @@ -19486,68 +20071,47 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 1000000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2026-05-31", + "last_updated": "2026-06-01", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:low", - "name": "Claude 4.6 Opus Thinking Low", - "display_name": "Claude 4.6 Opus Thinking Low", + "id": "minimax/minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 205000, + "output": 205000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -19556,59 +20120,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "interleaved": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6:thinking:medium", - "name": "Claude 4.6 Opus Thinking Medium", - "display_name": "Claude 4.6 Opus Thinking Medium", + "id": "minimax/minimax-m2.7", + "name": "Minimax M2.7", + "display_name": "Minimax M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -19617,245 +20161,197 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 4.998, - "output": 25.007 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-latest", - "name": "Claude Sonnet Latest", - "display_name": "Claude Sonnet Latest", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 High Speed", + "display_name": "MiniMax M2.5 High Speed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-13", "cost": { - "input": 2.992, - "output": 14.994, - "cache_read": 0.2992 + "input": 0.6, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6:thinking", - "name": "Claude Sonnet 4.6 Thinking", - "display_name": "Claude Sonnet 4.6 Thinking", + "id": "minimax/minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "mixed", - "budget": { - "min": 1024, - 
"unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2024-10", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 0.3, + "output": 2.4, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "kwaipilot/kat-coder-pro-v1", + "name": "KAT-Coder-Pro V1", + "display_name": "KAT-Coder-Pro V1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 256000, + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2024-10", + "release_date": "2025-10-24", + "last_updated": "2025-10-24", "cost": { - "input": 0.203, - "output": 2.24 + "input": 0.03, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-27b:thinking", - "name": "Qwen3.6 27B Thinking", - 
"display_name": "Qwen3.6 27B Thinking", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kat Coder Pro V2", + "display_name": "Kat Coder Pro V2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 260096, - "output": 65536 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-03-27", + "last_updated": "2026-03-30", "cost": { - "input": 0.203, - "output": 2.24 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" - }, + } + ] + }, + "submodel": { + "id": "submodel", + "name": "submodel", + "display_name": "submodel", + "api": "https://llm.submodel.ai/v1", + "doc": "https://submodel.gitbook.io", + "models": [ { - "id": "alibaba/qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 991800, - "output": 65536 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -19869,25 +20365,22 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - 
"input": 0.19, - "output": 1.16 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-omni", - "name": "MiMo V2 Omni", - "display_name": "MiMo V2 Omni", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" @@ -19895,27 +20388,27 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-thinking", - "name": "MiMo V2 Flash (Thinking)", - "display_name": "MiMo V2 Flash (Thinking)", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -19925,27 +20418,28 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.102, - "output": 0.306 + "input": 0.2, + "output": 0.3 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-thinking-original", - "name": "MiMo V2 Flash (Thinking) Original", - "display_name": "MiMo V2 Flash (Thinking) Original", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { 
"input": [ "text" @@ -19955,27 +20449,34 @@ ] }, "limit": { - "context": 256000, + "context": 131072, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.102, - "output": 0.306 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash-original", - "name": "MiMo V2 Flash Original", - "display_name": "MiMo V2 Flash Original", + "id": "zai-org/GLM-4.5-FP8", + "name": "GLM 4.5 FP8", + "display_name": "GLM 4.5 FP8", "modalities": { "input": [ "text" @@ -19985,27 +20486,29 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.102, - "output": 0.306 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "zai-org/GLM-4.5-Air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -20015,63 +20518,59 @@ ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-19", - "last_updated": "2026-03-19", + 
"open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2 + "input": 0.1, + "output": 0.5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "MiMo V2.5", - "display_name": "MiMo V2.5", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 75000, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -20081,27 +20580,40 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 75000, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.102, - "output": 0.306 + "input": 0.5, + "output": 2.15 }, "type": "chat" }, { - "id": 
"xiaomi/mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -20111,9 +20623,10 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 75000, + "output": 163840 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -20121,19 +20634,27 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.0036 + "input": 0.2, + "output": 0.8 }, "type": "chat" - }, + } + ] + }, + "huggingface": { + "id": "huggingface", + "name": "Hugging Face", + "display_name": "Hugging Face", + "api": "https://router.huggingface.co/v1", + "doc": "https://huggingface.co/docs/inference-providers", + "models": [ { - "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", - "name": "Omega Directive 24B Unslop v2.0", - "display_name": "Omega Directive 24B Unslop v2.0", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi-K2-Thinking", + "display_name": "Kimi-K2-Thinking", "modalities": { "input": [ "text" @@ -20143,107 +20664,125 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.5, - "output": 
0.5 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "mistral/mistral-medium-3.5", - "name": "Mistral Medium 3.5", - "display_name": "Mistral Medium 3.5", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi-K2-Instruct-0905", + "display_name": "Kimi-K2-Instruct-0905", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "cost": { - "input": 1.5, - "output": 7.5 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "mistral/mistral-medium-3.5:thinking", - "name": "Mistral Medium 3.5 Thinking", - "display_name": "Mistral Medium 3.5 Thinking", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "Kimi-K2-Instruct", + "display_name": "Kimi-K2-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 1.5, - "output": 7.5 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen 3 32b", - "display_name": "Qwen 3 32b", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", 
"modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 41000, - "output": 32768 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20257,34 +20796,40 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen/qwq-32b-preview", - "name": "Qwen QwQ 32B Preview", - "display_name": "Qwen QwQ 32B Preview", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20297,64 +20842,54 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "Qwen/Qwen3-Coder-Next", + "name": "Qwen3-Coder-Next", + "display_name": "Qwen3-Coder-Next", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 983616, + "context": 262144, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen/Qwen3-8B", - "name": "Qwen 3 8B", - "display_name": "Qwen 3 8B", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen 3 Embedding 8B", + "display_name": "Qwen 3 Embedding 8B", "modalities": { "input": [ "text" @@ -20364,54 +20899,79 @@ ] }, "limit": { - "context": 41000, - "output": 32768 + "context": 32000, + "output": 4096 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.01, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 66536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": 
"2024-01-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.47, - "output": 0.47 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen 3 235b A22B", - "display_name": "Qwen 3 235b A22B", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 41000, + "context": 262144, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20425,19 +20985,20 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen 3 235b A22B 2507 Thinking", - "display_name": "Qwen 3 235b A22B 2507 Thinking", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -20447,12 +21008,14 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20466,19 +21029,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", 
"cost": { "input": 0.3, - "output": 0.5 + "output": 3 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", "modalities": { "input": [ "text" @@ -20488,38 +21052,29 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 32000, + "output": 2048 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.08018, - "output": 5.4009 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -20529,27 +21084,29 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 66536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-17", - "last_updated": "2025-09-17", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1, - "output": 5 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen 3 14b", - "display_name": "Qwen 3 14b", + "id": 
"Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -20559,10 +21116,11 @@ ] }, "limit": { - "context": 41000, - "output": 32768 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true }, @@ -20578,19 +21136,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.08, - "output": 0.24 + "input": 0.3, + "output": 2 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -20601,43 +21160,46 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 200000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + 
"supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20650,35 +21212,35 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.112, - "output": 0.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-thinking", - "name": "Qwen3.5 Plus Thinking", - "display_name": "Qwen3.5 Plus Thinking", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983616, - "output": 65536 + "context": 202752, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -20694,21 +21256,21 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen/Qwen3-235B-A22B-Instruct-2507-TEE", - "name": "Qwen 3 235b A22B 2507 (TEE)", - "display_name": "Qwen 3 235b A22B 2507 (TEE)", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -20718,27 +21280,42 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.13, - "output": 0.5 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -20748,12 +21325,14 @@ ] }, "limit": { - "context": 41000, - "output": 32768 + "context": 202752, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20767,33 +21346,34 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "open_weights": true, + "release_date": "2026-04-03", + "last_updated": "2026-04-03", "cost": { - "input": 0.1, - "output": 0.3 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen3.5 9B", - "display_name": "Qwen3.5 9B", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 163840, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -20809,20 +21389,21 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-10", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { 
- "input": 0.05, - "output": 0.15 + "input": 3, + "output": 5 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B (Thinking)", - "display_name": "Qwen3 Next 80B A3B (Thinking)", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -20832,12 +21413,14 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 1048576, + "output": 393216 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -20851,19 +21434,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.15, - "output": 0.65 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -20873,27 +21458,35 @@ ] }, "limit": { - "context": 128000, + "context": 163840, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-17", - "last_updated": "2025-09-17", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.28, + "output": 0.4 }, "type": "chat" }, { - "id": "qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen 3 235b 
A22B 2507", - "display_name": "Qwen 3 235b A22B 2507", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -20903,27 +21496,41 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.13, - "output": 0.5 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3 Next 80B A3B (Instruct)", - "display_name": "Qwen3 Next 80B A3B (Instruct)", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -20933,72 +21540,55 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-11", - "last_updated": "2025-09-11", - "cost": { - "input": 0.15, - "output": 0.65 - }, - "type": "chat" - }, - { - "id": "qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen 2.5 Coder 32b", - "display_name": "Qwen 2.5 Coder 32b", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 8192 + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen/Qwen3.6-35B-A3B:thinking", - "name": "Qwen3.6 35B A3B Thinking", - "display_name": "Qwen3.6 35B A3B Thinking", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -21014,20 +21604,30 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-19", - "last_updated": "2026-04-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.112, - "output": 0.8 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" - }, + } + ] + }, + "minimax-coding-plan": { + "id": "minimax-coding-plan", + "name": "MiniMax Coding Plan (minimax.io)", + "display_name": "MiniMax Coding Plan (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/coding-plan/intro", + "models": [ { - "id": "qwen/qwen3-coder", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -21037,85 +21637,87 @@ ] }, "limit": { - "context": 262000, - "output": 65536 + "context": 204800, + "output": 131072 }, 
+ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.13, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b-thinking", - "name": "Qwen3.5 397B A17B Thinking", - "display_name": "Qwen3.5 397B A17B Thinking", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 204800, + "output": 131072 }, - "tool_call": false, + 
"temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -21131,20 +21733,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B", - "display_name": "Qwen2.5 72B", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -21154,88 +21758,114 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 196608, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.357, - "output": 0.408 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "extra_capabilities": { + 
"reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Salesforce/Llama-xLAM-2-70b-fc-r", - "name": "Llama-xLAM-2 70B fc-r", - "display_name": "Llama-xLAM-2 70B fc-r", + "id": "MiniMax-M3", + "name": "MiniMax-M3", + "display_name": "MiniMax-M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 512000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 2.5, - "output": 2.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Gryphe/MythoMax-L2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -21245,27 +21875,51 @@ ] }, "limit": { - "context": 4000, - "output": 4096 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-08", - 
"last_updated": "2025-08-08", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1003, - "output": 0.1003 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "novita-ai": { + "id": "novita-ai", + "name": "NovitaAI", + "display_name": "NovitaAI", + "api": "https://api.novita.ai/openai", + "doc": "https://novita.ai/docs/guides/introduction", + "models": [ { - "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", - "name": "Nemotron Tenyxchat Storybreaker 70b", - "display_name": "Nemotron Tenyxchat Storybreaker 70b", + "id": "inclusionai/ling-2.6-1t", + "name": "Ling-2.6-1T", + "display_name": "Ling-2.6-1T", "modalities": { "input": [ "text" @@ -21275,27 +21929,28 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", - "name": "Llama 3.05 Storybreaker Ministral 70b", - "display_name": "Llama 3.05 Storybreaker Ministral 70b", + "id": "inclusionai/ring-2.6-1t", + "name": "Ring-2.6-1T", + "display_name": "Ring-2.6-1T", "modalities": { "input": [ "text" @@ -21305,27 +21960,30 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + 
"release_date": "2026-05-08", + "last_updated": "2026-05-27", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.3, + "output": 2.5, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "pamanseau/OpenReasoning-Nemotron-32B", - "name": "OpenReasoning Nemotron 32B", - "display_name": "OpenReasoning Nemotron 32B", + "id": "inclusionai/ling-2.6-flash", + "name": "Ling-2.6-flash", + "display_name": "Ling-2.6-flash", "modalities": { "input": [ "text" @@ -21335,28 +21993,29 @@ ] }, "limit": { - "context": 32768, - "output": 65536 + "context": 262144, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { "input": 0.1, - "output": 0.4 + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "GalrionSoftworks/MN-LooseCannon-12B-v1", - "name": "MN-LooseCannon-12B-v1", - "display_name": "MN-LooseCannon-12B-v1", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -21367,26 +22026,27 @@ }, "limit": { "context": 16384, - "output": 8192 + "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "liquid/lfm-2-24b-a2b", - "name": "LFM2 24B A2B", - "display_name": "LFM2 24B A2B", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Llama3 70B 
Instruct", + "display_name": "Llama3 70B Instruct", "modalities": { "input": [ "text" @@ -21396,57 +22056,60 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 8192, + "output": 8000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.03, - "output": 0.12 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "soob3123/Veiled-Calla-12B", - "name": "Veiled Calla 12B", - "display_name": "Veiled Calla 12B", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout Instruct", + "display_name": "Llama 4 Scout Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-13", - "last_updated": "2025-04-13", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.18, + "output": 0.59 }, "type": "chat" }, { - "id": "soob3123/amoral-gemma3-27B-v2", - "name": "Amoral Gemma3 27B v2", - "display_name": "Amoral Gemma3 27B v2", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -21456,27 +22119,29 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 120000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-23", - "last_updated": 
"2025-05-23", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-07", + "last_updated": "2024-12-07", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.135, + "output": 0.4 }, "type": "chat" }, { - "id": "soob3123/GrayLine-Qwen3-8B", - "name": "Grayline Qwen3 8B", - "display_name": "Grayline Qwen3 8B", + "id": "meta-llama/llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -21486,27 +22151,28 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "Unbabel/M-Prometheus-14B", - "name": "M-Prometheus 14B", - "display_name": "M-Prometheus 14B", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" @@ -21517,56 +22183,59 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-29", - "last_updated": "2026-05-29", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.03, + "output": 0.05 }, "type": "chat" }, { - "id": "NousResearch/hermes-4-70b", - "name": "Hermes 4 Medium", - "display_name": "Hermes 4 Medium", + "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick Instruct", + "display_name": "Llama 4 Maverick Instruct", "modalities": { "input": [ - "text" 
+ "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1048576, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-06", + "last_updated": "2025-04-06", "cost": { - "input": 0.2006, - "output": 0.3995 + "input": 0.27, + "output": 0.85 }, "type": "chat" }, { - "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", - "name": "DeepHermes-3 Mistral 24B (Preview)", - "display_name": "DeepHermes-3 Mistral 24B (Preview)", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -21576,27 +22245,28 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-10", - "last_updated": "2025-05-10", + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.3, - "output": 0.3 + "input": 0.57, + "output": 2.3 }, "type": "chat" }, { - "id": "NousResearch/hermes-3-llama-3.1-70b", - "name": "Hermes 3 70B", - "display_name": "Hermes 3 70B", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -21606,87 +22276,134 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": 
[ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-07", - "last_updated": "2026-01-07", + "open_weights": true, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.408, - "output": 0.408 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-70B:thinking", - "name": "Hermes 4 (Thinking)", - "display_name": "Hermes 4 (Thinking)", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-17", - "last_updated": "2025-09-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.2006, - "output": 0.3995 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "NousResearch/hermes-4-405b", - "name": "Hermes 4 Large", - "display_name": "Hermes 4 Large", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - 
"release_date": "2025-08-26", - "last_updated": "2025-08-26", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "NousResearch/hermes-4-405b:thinking", - "name": "Hermes 4 Large (Thinking)", - "display_name": "Hermes 4 Large (Thinking)", + "id": "moonshotai/kimi-k2-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -21696,27 +22413,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Nevoria-R1-70b", - "name": "Steelskull Nevoria R1 70b", - "display_name": "Steelskull Nevoria R1 70b", + "id": "minimaxai/minimax-m1-80k", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -21726,57 +22445,62 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1000000, + "output": 40000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2025-06-17", 
+ "last_updated": "2025-06-17", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Cu-Mai-R1-70b", - "name": "Llama 3.3 70B Cu Mai", - "display_name": "Llama 3.3 70B Cu Mai", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B A3B", + "display_name": "ERNIE 4.5 VL 28B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 30000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Nevoria-70b", - "name": "Steelskull Nevoria 70b", - "display_name": "Steelskull Nevoria 70b", + "id": "baidu/ernie-4.5-21B-a3b", + "name": "ERNIE 4.5 21B A3B", + "display_name": "ERNIE 4.5 21B A3B", "modalities": { "input": [ "text" @@ -21786,57 +22510,62 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 120000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evayale-70B", - "name": "Evayale 70b ", - "display_name": "Evayale 70b 
", + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "ERNIE 4.5 VL 424B A47B", + "display_name": "ERNIE 4.5 VL 424B A47B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 123000, + "output": 16000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.42, + "output": 1.25 }, "type": "chat" }, { - "id": "Steelskull/L3.3-Electra-R1-70b", - "name": "Steelskull Electra R1 70b", - "display_name": "Steelskull Electra R1 70b", + "id": "baidu/ernie-4.5-21B-a3b-thinking", + "name": "ERNIE-4.5-21B-A3B-Thinking", + "display_name": "ERNIE-4.5-21B-A3B-Thinking", "modalities": { "input": [ "text" @@ -21846,27 +22575,30 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.69989, - "output": 0.69989 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "Steelskull/L3.3-MS-Evalebis-70b", - "name": "MS Evalebis 70b", - "display_name": "MS Evalebis 70b", + "id": "baidu/ernie-4.5-300b-a47b-paddle", + "name": "ERNIE 4.5 300B A47B", + "display_name": "ERNIE 4.5 300B A47B", "modalities": { "input": [ "text" @@ -21876,188 +22608,160 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 
123000, + "output": 12000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "essentialai/rnj-1-instruct", - "name": "RNJ-1 Instruct 8B", - "display_name": "RNJ-1 Instruct 8B", + "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", + "name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-13", - "last_updated": "2025-12-13", + "attachment": true, + "open_weights": true, + "release_date": "2025-11-26", + "last_updated": "2025-11-26", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.39, + "output": 0.39 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+", - "display_name": "Cohere: Command R+", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": true, + 
"release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 2.856, - "output": 14.246 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "cohere/command-r", - "name": "Cohere: Command R", - "display_name": "Cohere: Command R", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B", + "display_name": "Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-03-11", - "last_updated": "2024-03-11", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.476, - "output": 1.428 + "input": 0.13, + "output": 0.4 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0711", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "google/gemma-3-12b-it", + "name": "Gemma 3 12B", + "display_name": "Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", - "cost": { - "input": 0.1, - "output": 2 - }, - "type": "chat" - }, - { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 262144 - }, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.05, + "output": 0.1 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5:thinking", - "name": "Kimi K2.5 Thinking", - "display_name": "Kimi K2.5 Thinking", + "id": "google/gemma-3-27b-it", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ "text", @@ -22068,28 +22772,28 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 98304, + "output": 16384 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "open_weights": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.3, - "output": 1.9 + "input": 0.119, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "microsoft/wizardlm-2-8x22b", + "name": "Wizardlm 2 8x22B", + "display_name": "Wizardlm 2 8x22B", "modalities": { "input": [ "text" @@ -22099,27 +22803,28 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 65535, + "output": 8000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "open_weights": true, + "release_date": "2024-04-24", + "last_updated": "2024-04-24", "cost": { - "input": 0.1, - "output": 2 + "input": 0.62, + 
"output": 0.62 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text", @@ -22130,12 +22835,14 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -22144,113 +22851,118 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.53, - "output": 2.73 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: GPT OSS 20B", + "display_name": "OpenAI: GPT OSS 20B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 131072, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "moonshotai/kimi-latest", - "name": "Kimi Latest", - "display_name": "Kimi Latest", + "id": "sao10K/l31-70b-euryale-v2.2", + "name": "L31 70B Euryale V2.2", + "display_name": "L31 70B Euryale V2.2", "modalities": { "input": [ 
- "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.5, - "output": 2.6, - "cache_read": 0.125 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6:thinking", - "name": "Kimi K2.6 Thinking", - "display_name": "Kimi K2.6 Thinking", + "id": "sao10K/L3-8B-stheno-v3.2", + "name": "L3 8B Stheno V3.2", + "display_name": "L3 8B Stheno V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 8192, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-21", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.53, - "output": 2.73 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-original", - "name": "Kimi K2 Thinking Original", - "display_name": "Kimi K2 Thinking Original", + "id": "sao10K/l3-8b-lunaris", + "name": "Sao10k L3 8B Lunaris\t", + "display_name": "Sao10k L3 8B Lunaris\t", "modalities": { "input": [ "text" @@ -22260,70 +22972,59 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - 
"release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "sao10K/l3-70b-euryale-v2.1", + "name": "L3 70B Euryale V2.1\t", + "display_name": "L3 70B Euryale V2.1\t", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-18", + "last_updated": "2024-06-18", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-turbo-original", - "name": "Kimi K2 Thinking Turbo Original", - "display_name": "Kimi K2 Thinking Turbo Original", + "id": "baichuan/baichuan-m2-32b", + "name": "baichuan-m2-32b", + "display_name": "baichuan-m2-32b", "modalities": { "input": [ "text" @@ -22333,121 +23034,155 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-08-13", + "last_updated": "2025-08-13", "cost": 
{ - "input": 1.15, - "output": 8 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Llama 4 Maverick", - "display_name": "Llama 4 Maverick", + "id": "mistralai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 60288, + "output": 16000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-30", + "last_updated": "2024-07-30", "cost": { - "input": 0.18000000000000002, - "output": 0.8 + "input": 0.04, + "output": 0.17 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3b Instruct", - "display_name": "Llama 3.2 3b Instruct", + "id": "xiaomimimo/mimo-v2-flash", + "name": "XiaomiMiMo/MiMo-V2-Flash", + "display_name": "XiaomiMiMo/MiMo-V2-Flash", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 0.0306, - "output": 0.0493 + "input": 0.1, + "output": 0.3, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "xiaomimimo/mimo-v2-pro", + "name": "MiMo-V2-Pro", + 
"display_name": "MiMo-V2-Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 65536 + "context": 1048576, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-05-27", "cost": { - "input": 0.085, - "output": 0.46 + "input": 2, + "output": 6, + "cache_read": 0.4, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8b Instruct", - "display_name": "Llama 3.1 8b Instruct", + "id": "xiaomimimo/mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -22457,27 +23192,58 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048576, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-05-27", 
"cost": { - "input": 0.0544, - "output": 0.0544 + "input": 2, + "output": 6, + "cache_read": 0.4, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "gryphe/mythomax-l2-13b", + "name": "Mythomax L2 13B", + "display_name": "Mythomax L2 13B", "modalities": { "input": [ "text" @@ -22487,27 +23253,28 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 4096, + "output": 3200 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "open_weights": true, + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.05, - "output": 0.23 + "input": 0.09, + "output": 0.09 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v2-72b", - "name": "Magnum V2 72B", - "display_name": "Magnum V2 72B", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -22517,58 +23284,77 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 
2.006, - "output": 2.992 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", + "id": "zai-org/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ "text", - "pdf" + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 65536, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 2.006, - "output": 2.992 + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", - "name": "MS3.2 24B Magnum Diamond", - "display_name": "MS3.2 24B Magnum Diamond", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -22578,27 +23364,41 @@ ] }, "limit": { - "context": 16384, - "output": 32768 + "context": 131072, + "output": 98304 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" 
}, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "ERNIE 4.5 VL 28B", - "display_name": "ERNIE 4.5 VL 28B", + "id": "zai-org/autoglm-phone-9b-multilingual", + "name": "AutoGLM-Phone-9B-Multilingual", + "display_name": "AutoGLM-Phone-9B-Multilingual", "modalities": { "input": [ "text", @@ -22609,27 +23409,28 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 65536, + "output": 65536 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": true, + "release_date": "2025-12-10", + "last_updated": "2025-12-10", "cost": { - "input": 0.13999999999999999, - "output": 0.5599999999999999 + "input": 0.035, + "output": 0.138 }, "type": "chat" }, { - "id": "nanogpt/coding-router:max", - "name": "Coding Router Max", - "display_name": "Coding Router Max", + "id": "zai-org/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -22639,29 +23440,41 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "nanogpt/coding-router:high", - "name": "Coding Router High", - "display_name": "Coding Router High", + "id": "zai-org/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ 
"text" @@ -22671,61 +23484,77 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "open_weights": true, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.1, + "input": 0.55, "output": 2.2, "cache_read": 0.11 }, "type": "chat" }, { - "id": "nanogpt/coding-router", - "name": "Coding Router", - "display_name": "Coding Router", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ - "text" + "text", + "video", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 1.1, - "output": 2.2, - "cache_read": 0.11 + "input": 0.3, + "output": 0.9, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "nanogpt/coding-router:medium", - "name": "Coding Router Medium", - "display_name": "Coding Router Medium", + "id": "zai-org/glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ "text" @@ -22735,29 +23564,30 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 98304 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": 
true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.13, + "output": 0.85 }, "type": "chat" }, { - "id": "nanogpt/coding-router:low", - "name": "Coding Router Low", - "display_name": "Coding Router Low", + "id": "zai-org/glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -22767,29 +23597,36 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "abacusai/Dracarys-72B-Instruct", - "name": "Llama 3.1 70B Dracarys 2", - "display_name": "Llama 3.1 70B Dracarys 2", + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -22799,27 +23636,41 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 202800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": 
"2025-08-02", - "last_updated": "2025-08-02", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-12", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "x-ai/grok-4.20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "paddlepaddle/paddleocr-vl", + "name": "PaddleOCR-VL", + "display_name": "PaddleOCR-VL", "modalities": { "input": [ "text", @@ -22830,173 +23681,183 @@ ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 16384, + "output": 16384 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-03-31", + "open_weights": true, + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 2, - "output": 6 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "x-ai/grok-build-0.1", - "name": "Grok Build 0.1", - "display_name": "Grok Build 0.1", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-20", - "last_updated": "2026-05-20", + "open_weights": true, + "release_date": "2025-09-24", + 
"last_updated": "2025-09-24", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.2 + "input": 0.98, + "output": 3.95 }, "type": "chat" }, { - "id": "x-ai/grok-4.20", - "name": "Grok 4.20", - "display_name": "Grok 4.20", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "qwen/qwen3-vl-30b-a3b-thinking", + "display_name": "qwen/qwen3-vl-30b-a3b-thinking", "modalities": { "input": [ "text", - "image" - ], + "image", + "video" + ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 131072 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-03-31", + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 2, - "output": 6 + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "x-ai/grok-latest", - "name": "Grok Latest", - "display_name": "Grok Latest", + "id": "qwen/qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 131072, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 
0.09, + "output": 0.58 }, "type": "chat" }, { - "id": "x-ai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30b A3B Instruct", + "display_name": "Qwen3 Coder 30b A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 160000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-09", + "last_updated": "2025-10-09", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen3-8b-fp8", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" @@ -23004,26 +23865,28 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 20000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.035, + "output": 0.138 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1:thinking", - "name": "DeepSeek V3.1 Thinking", - "display_name": "DeepSeek V3.1 Thinking", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": 
"Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text" @@ -23033,57 +23896,109 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "qwen/qwen3-vl-8b-instruct", + "display_name": "qwen/qwen3-vl-8b-instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-02", - "last_updated": "2025-08-02", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2025-10-17", + "cost": { + "input": 0.08, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-omni-30b-a3b-thinking", + "name": "Qwen3 Omni 30B A3B Thinking", + "display_name": "Qwen3 Omni 30B A3B Thinking", + "modalities": { + "input": [ + "text", + "audio", + "video", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65536, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + 
"attachment": true, + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { "input": 0.25, - "output": 0.7 + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp-thinking", - "name": "DeepSeek V3.2 Exp Thinking", - "display_name": "DeepSeek V3.2 Exp Thinking", + "id": "qwen/qwen3.7-max", + "name": "Qwen3.7-Max", + "display_name": "Qwen3.7-Max", "modalities": { "input": [ "text" @@ -23093,28 +24008,36 @@ ] }, "limit": { - "context": 163840, + "context": 1000000, "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-05-21", + "last_updated": "2026-05-27", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 1.25, + "output": 3.75, + "cache_read": 0.125, + "cache_write": 1.5625 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", - "name": "DeepSeek V3.1 Terminus (Thinking)", - "display_name": "DeepSeek V3.1 Terminus (Thinking)", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -23124,27 +24047,40 @@ ] }, "limit": { - "context": 128000, + "context": 262144, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": 
"2025-09-24", "cost": { - "input": 0.25, - "output": 0.7 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "qwen/qwen2.5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -23154,27 +24090,28 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 32000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -23184,10 +24121,11 @@ ] }, "limit": { - "context": 128000, - "output": 163840 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -23204,19 +24142,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", "cost": { - "input": 0.4, - "output": 1.7 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Hanami-x1", - "name": "Llama 3.1 70B Hanami", - "display_name": "Llama 3.1 70B Hanami", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22b Thinking 2507", + "display_name": "Qwen3 235B 
A22b Thinking 2507", "modalities": { "input": [ "text" @@ -23226,27 +24164,41 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.3, + "output": 3 }, "type": "chat" }, { - "id": "Sao10K/L3.3-70B-Euryale-v2.3", - "name": "Llama 3.3 70B Euryale", - "display_name": "Llama 3.3 70B Euryale", + "id": "qwen/qwen-mt-plus", + "name": "Qwen MT Plus", + "display_name": "Qwen MT Plus", "modalities": { "input": [ "text" @@ -23256,27 +24208,28 @@ ] }, "limit": { - "context": 20480, - "output": 16384 + "context": 16384, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "release_date": "2025-09-03", + "last_updated": "2025-09-03", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.25, + "output": 0.75 }, "type": "chat" }, { - "id": "Sao10K/L3-8B-Stheno-v3.2", - "name": "Sao10K Stheno 8b", - "display_name": "Sao10K Stheno 8b", + "id": "qwen/qwen3-32b-fp8", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -23286,27 +24239,29 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 40960, + "output": 20000 }, + "temperature": true, 
"tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.1, + "output": 0.45 }, "type": "chat" }, { - "id": "Sao10K/L3.1-70B-Euryale-v2.2", - "name": "Llama 3.1 70B Euryale", - "display_name": "Llama 3.1 70B Euryale", + "id": "qwen/qwen3-4b-fp8", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -23316,122 +24271,139 @@ ] }, "limit": { - "context": 20480, - "output": 16384 + "context": 128000, + "output": 20000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.306, - "output": 0.357 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", - "name": "Nvidia Nemotron Super 49B v1.5", - "display_name": "Nvidia Nemotron Super 49B v1.5", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B Instruct", + "display_name": "Qwen2.5 VL 72B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.8, + 
"output": 0.8 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", - "name": "Nvidia Nemotron 3 Nano Omni", - "display_name": "Nvidia Nemotron 3 Nano Omni", + "id": "qwen/qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 40960, + "output": 20000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.105, - "output": 0.42 + "input": 0.09, + "output": 0.45 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nvidia Nemotron 3 Nano 30B", - "display_name": "Nvidia Nemotron 3 Nano 30B", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5-27B", + "display_name": "Qwen3.5-27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", 
- "name": "Nvidia Nemotron Super 49B", - "display_name": "Nvidia Nemotron Super 49B", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ "text" @@ -23441,28 +24413,29 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.38, + "output": 0.4 }, "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B v2", - "display_name": "Nvidia Nemotron Nano 9B v2", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -23472,59 +24445,73 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", - "name": "Nvidia Nemotron 70b", - "display_name": "Nvidia Nemotron 70b", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5-35B-A3B", + "display_name": "Qwen3.5-35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": 
true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.357, - "output": 0.408 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nvidia Nemotron 3 Super 120B", - "display_name": "Nvidia Nemotron 3 Super 120B", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -23535,31 +24522,33 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.3, + "output": 1.3 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b:thinking", - "name": "Nvidia Nemotron 3 Super 120B Thinking", - "display_name": "Nvidia Nemotron 3 Super 120B Thinking", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -23567,7 +24556,7 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -23575,23 
+24564,36 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "qwen/qwen3-vl-30b-a3b-instruct", + "display_name": "qwen/qwen3-vl-30b-a3b-instruct", "modalities": { "input": [ - "text" + "text", + "video", + "image" ], "output": [ "text" @@ -23599,117 +24601,143 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", "cost": { - "input": 0.045000000000000005, - "output": 0.15 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "qwen/qwen3-omni-30b-a3b-instruct", + "name": "Qwen3 Omni 30B A3B Instruct", + "display_name": "Qwen3 Omni 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "video", + "audio", + "image" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 262144, - "output": 80000 + "context": 65536, + "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": true, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { "input": 0.25, - "output": 0.9 + "output": 0.97, + "input_audio": 2.2, + "output_audio": 1.788 }, "type": "chat" }, { - "id": "Infermatic/MN-12B-Inferor-v0.0", - "name": "Mistral Nemo Inferor 12B", - "display_name": "Mistral Nemo Inferor 12B", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "attachment": true, + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 0.25499999999999995, - "output": 0.49299999999999994 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "meganova-ai/manta-mini-1.0", - "name": "Manta Mini 1.0", - "display_name": "Manta Mini 1.0", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5-122B-A10B", + "display_name": "Qwen3.5-122B-A10B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.02, - "output": 0.16 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "meganova-ai/manta-flash-1.0", - "name": "Manta Flash 1.0", - "display_name": "Manta Flash 1.0", + "id": "qwen/qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ "text" @@ -23719,27 +24747,29 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 40960, + "output": 20000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.02, - "output": 0.16 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "meganova-ai/manta-pro-1.0", - "name": "Manta Pro 1.0", - "display_name": "Manta Pro 1.0", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -23749,27 +24779,42 @@ ] }, "limit": { - "context": 32768, + "context": 163840, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-20", - "last_updated": "2025-12-20", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + 
"last_updated": "2025-05-28", "cost": { - "input": 0.060000000000000005, - "output": 0.5 + "input": 0.7, + "output": 2.5, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", - "name": "Dolphin 72b", - "display_name": "Dolphin 72b", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -23779,58 +24824,75 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 1048576, + "output": 393216 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.306, - "output": 0.306 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "Deepseek V3.1 Terminus", + "display_name": "Deepseek V3.1 Terminus", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-22", + "last_updated": "2025-09-22", 
"cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", - "name": "EVA-Qwen2.5-72B-v0.2", - "display_name": "EVA-Qwen2.5-72B-v0.2", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -23840,57 +24902,62 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 163840, + "output": 163840 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 0.27, + "output": 1.12, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", - "name": "EVA-Qwen2.5-32B-v0.2", - "display_name": "EVA-Qwen2.5-32B-v0.2", + "id": "deepseek/deepseek-ocr", + "name": "DeepSeek-OCR", + "display_name": "DeepSeek-OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-24", + "last_updated": "2025-10-24", "cost": { - "input": 0.7989999999999999, - "output": 0.7989999999999999 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", - "name": "EVA Llama 3.33 70B", - "display_name": "EVA Llama 3.33 70B", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 
Distill LLama 70B", + "display_name": "DeepSeek R1 Distill LLama 70B", "modalities": { "input": [ "text" @@ -23900,27 +24967,34 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 8192, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "open_weights": true, + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", - "name": "EVA-LLaMA-3.33-70B-v0.1", - "display_name": "EVA-LLaMA-3.33-70B-v0.1", + "id": "deepseek/deepseek-r1-turbo", + "name": "DeepSeek R1 (Turbo)\t", + "display_name": "DeepSeek R1 (Turbo)\t", "modalities": { "input": [ "text" @@ -23930,27 +25004,29 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 64000, + "output": 16000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 2.006, - "output": 2.006 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "Deepseek Prover V2 671B", + "display_name": "Deepseek Prover V2 671B", "modalities": { "input": [ "text" @@ -23960,28 +25036,28 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 160000, + "output": 160000 }, + "temperature": true, "tool_call": false, 
"reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "open_weights": true, + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -23991,28 +25067,42 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 393216 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.1, - "output": 0.3 + "input": 1.69, + "output": 3.38, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "LLM360/K2-Think", - "name": "K2-Think", - "display_name": "K2-Think", + "id": "deepseek/deepseek-v3.2-exp", + "name": "Deepseek V3.2 Exp", + "display_name": "Deepseek V3.2 Exp", "modalities": { "input": [ "text" @@ -24022,57 +25112,60 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-26", - "last_updated": 
"2025-07-26", + "open_weights": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-lite", - "name": "ByteDance Seed 2.0 Lite", - "display_name": "ByteDance Seed 2.0 Lite", + "id": "deepseek/deepseek-ocr-2", + "name": "deepseek/deepseek-ocr-2", + "display_name": "deepseek/deepseek-ocr-2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-10", + "attachment": true, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.25, - "output": 2 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "TEE/gemma4-31b:thinking", - "name": "Gemma 4 31B Thinking TEE", - "display_name": "Gemma 4 31B Thinking TEE", + "id": "deepseek/deepseek-r1-distill-qwen-14b", + "name": "DeepSeek R1 Distill Qwen 14B", + "display_name": "DeepSeek R1 Distill Qwen 14B", "modalities": { "input": [ "text" @@ -24082,28 +25175,28 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 32768, + "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-02", - "last_updated": "2026-05-02", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.45, - "output": 1 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "TEE/qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507 TEE", - "display_name": "Qwen3 30B A3B Instruct 2507 TEE", + "id": 
"deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -24113,27 +25206,30 @@ ] }, "limit": { - "context": 262000, + "context": 131072, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.15, - "output": 0.44999999999999996 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "TEE/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B TEE", - "display_name": "Qwen3.5 122B A10B TEE", + "id": "deepseek/deepseek-r1-0528-qwen3-8b", + "name": "DeepSeek R1 0528 Qwen3 8B", + "display_name": "DeepSeek R1 0528 Qwen3 8B", "modalities": { "input": [ "text" @@ -24143,70 +25239,60 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-26", - "last_updated": "2026-05-26", + "open_weights": true, + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 0.46, - "output": 3.68 + "input": 0.06, + "output": 0.09 }, "type": "chat" }, { - "id": "TEE/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B TEE", - "display_name": "Qwen2.5 VL 72B TEE", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek R1 Distill Qwen 32B", + "display_name": "DeepSeek R1 Distill Qwen 32B", "modalities": { "input": [ - "text", 
- "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 64000, + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "TEE/glm-5.1-thinking", - "name": "GLM 5.1 Thinking TEE", - "display_name": "GLM 5.1 Thinking TEE", + "id": "deepseek/deepseek-v3-turbo", + "name": "DeepSeek V3 (Turbo)\t", + "display_name": "DeepSeek V3 (Turbo)\t", "modalities": { "input": [ "text" @@ -24216,42 +25302,41 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 64000, + "output": 16000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": true, + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 1.5, - "output": 5.25, - "cache_read": 0.3 + "input": 0.4, + "output": 1.3 }, "type": "chat" }, { - "id": "TEE/qwen3.6-35b-a3b-uncensored", - "name": "Qwen3.6 35B A3B Uncensored TEE", - "display_name": "Qwen3.6 35B A3B Uncensored TEE", + "id": "deepseek/deepseek-v3.2", + "name": "Deepseek V3.2", + "display_name": "Deepseek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -24268,20 +25353,21 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-23", - "last_updated": "2026-05-23", + "attachment": 
false, + "open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.269, + "output": 0.4, + "cache_read": 0.1345 }, "type": "chat" }, { - "id": "TEE/gemma-4-31b-it", - "name": "Gemma 4 31B IT TEE", - "display_name": "Gemma 4 31B IT TEE", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -24291,28 +25377,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-26", - "last_updated": "2026-05-26", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-05-27", "cost": { - "input": 0.15, - "output": 0.46 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "TEE/deepseek-v3.2", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -24322,69 +25422,84 @@ ] }, "limit": { - "context": 164000, - "output": 65536 + "context": 204800, + "output": 131100 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-12-01", - 
"last_updated": "2025-12-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.5, - "output": 1 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "TEE/kimi-k2.6", - "name": "Kimi K2.6 TEE", - "display_name": "Kimi K2.6 TEE", + "id": "minimax/minimax-m2.1", + "name": "Minimax M2.1", + "display_name": "Minimax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.5, - "output": 5.25, - "cache_read": 0.375 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "TEE/glm-4.7", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -24394,12 +25509,14 @@ ] }, "limit": { - "context": 131000, - "output": 65535 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -24413,19 +25530,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.85, - "output": 3.3 + "input": 
0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "TEE/gpt-oss-120b", - "name": "GPT-OSS 120B TEE", - "display_name": "GPT-OSS 120B TEE", + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -24435,32 +25553,41 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2, - "output": 2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "TEE/gpt-oss-20b", - "name": "GPT-OSS 20B TEE", - "display_name": "GPT-OSS 20B TEE", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { "input": [ "text" @@ -24470,32 +25597,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131100 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.2, - "output": 0.8 + 
"input": 0.6, + "output": 2.4, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "TEE/gemma-3-27b-it", - "name": "Gemma 3 27B TEE", - "display_name": "Gemma 3 27B TEE", + "id": "kwaipilot/kat-coder-pro", + "name": "Kat Coder Pro", + "display_name": "Kat Coder Pro", "modalities": { "input": [ "text" @@ -24505,27 +25641,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "open_weights": true, + "release_date": "2026-01-05", + "last_updated": "2026-01-05", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "TEE/deepseek-v4-pro:thinking", - "name": "DeepSeek V4 Pro Thinking TEE", - "display_name": "DeepSeek V4 Pro Thinking TEE", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ "text" @@ -24535,286 +25673,354 @@ ] }, "limit": { - "context": 800000, - "output": 65536 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "open_weights": true, + "release_date": "2024-06-27", + "last_updated": "2024-06-27", "cost": { - "input": 1.5, - "output": 5.25, - "cache_read": 0.15 + "input": 0.14, + "output": 0.14 }, "type": "chat" - }, + } + ] + }, + "xai": { + "id": "xai", + "name": "xai", + "display_name": "xai", + "doc": "https://docs.x.ai/docs/models", + "models": [ { - "id": "TEE/glm-4.7-flash", - "name": "GLM 4.7 Flash TEE", - "display_name": "GLM 4.7 Flash TEE", + "id": 
"grok-4.20-multi-agent-0309", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 1000000, + "output": 30000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.15, - "output": 0.5 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "TEE/kimi-k2.5-thinking", - "name": "Kimi K2.5 Thinking TEE", - "display_name": "Kimi K2.5 Thinking TEE", + "id": "grok-4.20-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65535 + "context": 1000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.3, - "output": 1.9 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + 
"context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "TEE/llama3-3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-03", - "last_updated": "2025-07-03", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 2, - "output": 2 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "TEE/glm-5", - "name": "GLM 5 TEE", - "display_name": "GLM 5 TEE", + "id": "grok-imagine-image-quality", + "name": "Grok Imagine Image Quality", + "display_name": "Grok Imagine Image Quality", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "image", + "pdf" ] }, "limit": { - "context": 203000, - "output": 65535 + "context": 8000, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": 
"2026-02-11", - "cost": { - "input": 1.2, - "output": 3.5 - }, + "release_date": "2026-04-03", + "last_updated": "2026-04-03", "type": "chat" }, { - "id": "TEE/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "grok-imagine-video", + "name": "Grok Imagine Video", + "display_name": "Grok Imagine Video", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "pdf" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 258048, - "output": 65536 + "context": 1024, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-02-28", - "cost": { - "input": 0.6, - "output": 3.6 - }, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "TEE/minimax-m2.5", - "name": "MiniMax M2.5 TEE", - "display_name": "MiniMax M2.5 TEE", + "id": "grok-4.20-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 1000000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.2, - "output": 1.38 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + 
"input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "TEE/gemma-4-26b-a4b-uncensored", - "name": "Gemma 4 26B A4B Uncensored TEE", - "display_name": "Gemma 4 26B A4B Uncensored TEE", + "id": "grok-imagine-image", + "name": "Grok Imagine Image", + "display_name": "Grok Imagine Image", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text" + "image", + "pdf" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 8000, + "output": 8192 }, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-23", - "last_updated": "2026-05-23", - "cost": { - "input": 0.15, - "output": 0.7 - }, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { - "id": "TEE/deepseek-v4-pro", - "name": "DeepSeek V4 Pro TEE", - "display_name": "DeepSeek V4 Pro TEE", + "id": "grok-build-0.1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 800000, - "output": 65536 + "context": 256000, + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -24822,30 +26028,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.5, - "output": 5.25, - "cache_read": 0.15 + "input": 1, + "output": 2, + "cache_read": 0.2, + 
"tiers": [ + { + "input": 2, + "output": 4, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 4, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "TEE/kimi-k2.5", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "grok-3-mini-fast-beta", + "name": "Grok 3 Mini Fast Beta", + "display_name": "Grok 3 Mini Fast Beta", "modalities": { "input": [ "text" @@ -24855,38 +26071,26 @@ ] }, "limit": { - "context": 128000, - "output": 65535 + "context": 120000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true, + "effort": "low" }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "search": { + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", - "cost": { - "input": 0.3, - "output": 1.9 - }, "type": "chat" }, { - "id": "TEE/deepseek-v3.1", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "grok-3-mini-beta", + "name": "Grok 3 Mini Beta", + "display_name": "Grok 3 Mini Beta", "modalities": { "input": [ "text" @@ -24896,136 +26100,109 @@ ] }, "limit": { - "context": 164000, - "output": 8192 + "context": 120000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { + "supported": true, + "default": true, + "effort": "low" + }, + "search": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 1, - "output": 2.5 - }, "type": "chat" }, { - "id": "TEE/qwen3.5-27b", - "name": "Qwen3.5 27B TEE", - "display_name": "Qwen3.5 27B TEE", + "id": "grok-3-fast-beta", + "name": "Grok 3 
Fast Beta", + "display_name": "Grok 3 Fast Beta", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 120000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", - "cost": { - "input": 0.3, - "output": 2.4 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "TEE/gemma4-31b", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "grok-2-vision-1212", + "name": "Grok 2 Vision 1212", + "display_name": "Grok 2 Vision 1212", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 32000, + "output": 32000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-04", - "last_updated": "2026-04-04", - "cost": { - "input": 0.45, - "output": 1 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "TEE/glm-5.1", - "name": "GLM 5.1 TEE", - "display_name": "GLM 5.1 TEE", + "id": "grok-2-image-1212", + "name": "Grok 2 Image 1212", + "display_name": "Grok 2 Image 1212", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 130000, + "output": 100000 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "search": 
{ + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", - "cost": { - "input": 1.5, - "output": 5.25, - "cache_read": 0.3 - }, "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "DeepSeek V3.1 Nex N1", - "display_name": "DeepSeek V3.1 Nex N1", + "id": "grok-3-beta", + "name": "Grok 3 Beta", + "display_name": "Grok 3 Beta", "modalities": { "input": [ "text" @@ -25035,27 +26212,24 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 120000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", - "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "search": { + "supported": false }, + "attachment": false, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "Hunyuan MT 7B", - "display_name": "Hunyuan MT 7B", + "id": "grok-2-1212", + "name": "Grok 2 1212", + "display_name": "Grok 2 1212", "modalities": { "input": [ "text" @@ -25065,27 +26239,33 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 120000, + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-09-18", - "cost": { - "input": 10, - "output": 20 + "search": { + "supported": false }, + "attachment": false, "type": "chat" - }, + } + ] + }, + "privatemode-ai": { + "id": "privatemode-ai", + "name": "Privatemode AI", + "display_name": "Privatemode AI", + "api": "http://localhost:8080/v1", + "doc": "https://docs.privatemode.ai/api/overview", + "models": [ { - "id": "tencent/hy3-preview", - "name": "Tencent: Hy3 preview", - "display_name": "Tencent: Hy3 preview", + "id": "qwen3-embedding-4b", + "name": 
"Qwen3-Embedding 4B", + "display_name": "Qwen3-Embedding 4B", "modalities": { "input": [ "text" @@ -25095,64 +26275,62 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 2560 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-06-06", + "last_updated": "2025-06-06", "cost": { - "input": 0.066, - "output": 0.26, - "cache_read": 0.029 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "ibm-granite/granite-4.1-8b", - "name": "Granite 4.1 8B", - "display_name": "Granite 4.1 8B", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", - "name": "Llama 3.1 70B Celeste v0.1", - "display_name": "Llama 3.1 70B Celeste v0.1", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -25162,61 +26340,67 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "stepfun/step-3.7-flash:thinking", - "name": "Step 3.7 Flash Thinking", - "display_name": "Step 3.7 Flash Thinking", + "id": "whisper-large-v3", + "name": "Whisper large-v3", + "display_name": "Whisper large-v3", "modalities": { "input": [ - "text", - "image", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-29", - "last_updated": "2026-05-29", + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2023-09-01", "cost": { - "input": 0.2, - "output": 1.15, - "cache_read": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "aion-labs/aion-2.5", - "name": "AionLabs: Aion-2.5", - "display_name": "AionLabs: Aion-2.5", + "id": "qwen3-coder-30b-a3b", + "name": "Qwen3-Coder 30B-A3B", + "display_name": "Qwen3-Coder 30B-A3B", "modalities": { "input": [ "text" @@ -25226,28 +26410,38 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-20", - "last_updated": "2026-03-20", + "open_weights": true, + 
"knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.35 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "drun": { + "id": "drun", + "name": "D.Run (China)", + "display_name": "D.Run (China)", + "api": "https://chat.d.run/v1", + "doc": "https://www.d.run", + "models": [ { - "id": "aion-labs/aion-2.0", - "name": "AionLabs: Aion-2.0", - "display_name": "AionLabs: Aion-2.0", + "id": "public/deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -25258,26 +26452,28 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.8, - "output": 1.6 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "Aion 1.0", - "display_name": "Aion 1.0", + "id": "public/deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -25287,27 +26483,41 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 131072, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-01", - "last_updated": "2025-02-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": 
"2025-01-20", "cost": { - "input": 3.995, - "output": 7.99 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "Llama 3.1 8b (uncensored)", - "display_name": "Llama 3.1 8b (uncensored)", + "id": "public/minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -25317,27 +26527,49 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0.29, + "output": 1.16 }, "type": "chat" - }, + } + ] + }, + "alibaba-token-plan-cn": { + "id": "alibaba-token-plan-cn", + "name": "Alibaba Token Plan (China)", + "display_name": "Alibaba Token Plan (China)", + "api": "https://token-plan.cn-beijing.maas.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/zh/model-studio/token-plan-overview", + "models": [ { - "id": "aion-labs/aion-1.0-mini", - "name": "Aion 1.0 mini (DeepSeek)", - "display_name": "Aion 1.0 mini (DeepSeek)", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -25347,57 +26579,83 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 384000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.7989999999999999, - "output": 1.394 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon Nova Pro 1.0", - "display_name": "Amazon Nova Pro 1.0", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 32000 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.7989999999999999, - "output": 3.1959999999999997 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon Nova Lite 1.0", - "display_name": "Amazon Nova Lite 1.0", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -25407,27 +26665,36 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": 
true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.0595, - "output": 0.238 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon Nova Micro 1.0", - "display_name": "Amazon Nova Micro 1.0", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -25437,27 +26704,42 @@ ] }, "limit": { - "context": 128000, - "output": 5120 + "context": 202752, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.0357, - "output": 0.1394 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon Nova 2 Lite", - "display_name": "Amazon Nova 2 Lite", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -25468,90 +26750,124 @@ }, "limit": { "context": 1000000, - "output": 65535 + "output": 384000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, 
"attachment": false, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.5099999999999999, - "output": 4.25 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-flash", - "name": "Ling 2.6 Flash", - "display_name": "Ling 2.6 Flash", + "id": "wan2.7-image-pro", + "name": "Wan2.7 Image Pro", + "display_name": "Wan2.7 Image Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 0.08, - "output": 0.24 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "inclusionai/ling-2.6-1t", - "name": "Ling 2.6 1T", - "display_name": "Ling 2.6 1T", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - 
"input": 0.3, - "output": 2.5, - "cache_read": 0.06 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "inclusionai/ring-2.6-1t", - "name": "Ring 2.6 1T", - "display_name": "Ring 2.6 1T", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -25559,180 +26875,228 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-05-08", - "last_updated": "2026-05-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 1, - "output": 3 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mlabonne/NeuralDaredevil-8B-abliterated", - "name": "Neural Daredevil 8B abliterated", - "display_name": "Neural Daredevil 8B abliterated", + "id": "qwen-image-2.0", + "name": "Qwen Image 2.0", + "display_name": "Qwen Image 2.0", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.44, - "output": 0.44 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "Gemma 3 27B IT", - "display_name": "Gemma 3 27B IT", + "id": 
"MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 196608, + "output": 24576 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.2992, - "output": 0.2992 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "Gemma 3 12B IT", - "display_name": "Gemma 3 12B IT", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 262144, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.272, - "output": 0.272 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": 
"unsloth/gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": "qwen-image-2.0-pro", + "name": "Qwen Image 2.0 Pro", + "display_name": "Qwen Image 2.0 Pro", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-10", - "last_updated": "2025-03-10", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.2006, - "output": 0.2006 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "featherless-ai/Qwerky-72B", - "name": "Qwerky 72B", - "display_name": "Qwerky 72B", + "id": "wan2.7-image", + "name": "Wan2.7 Image", + "display_name": "Wan2.7 Image", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32000, + "context": 8192, "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2025-03-20", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "shisa-ai/shisa-v2-llama3.3-70b", - "name": "Shisa V2 Llama 3.3 70B", - "display_name": "Shisa V2 Llama 3.3 70B", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -25742,27 +27106,42 @@ ] }, "limit": { - "context": 128000, + "context": 202752, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "shisa-ai/shisa-v2.1-llama3.3-70b", - "name": "Shisa V2.1 Llama 3.3 70B", - "display_name": "Shisa V2.1 Llama 3.3 70B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -25772,58 +27151,92 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 131072, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-03", + "last_updated": "2025-12-05", "cost": { - "input": 0.5, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 6144, - "output": 4096 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.7989999999999999, - "output": 1.2069999999999999 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "moonshot-ai": { + "id": "moonshot-ai", + "name": "Moonshot AI", + "display_name": "Moonshot AI", + "api": "https://api.moonshot.ai/v1", + "doc": "https://platform.moonshot.ai/docs/api/chat", + "models": [ { - "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", - "name": "Mistral Nemo Starcannon 12b v1", - "display_name": "Mistral Nemo Starcannon 12b v1", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -25833,64 +27246,78 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemini-pro-latest", - "name": "Gemini Pro Latest", - "display_name": "Gemini Pro Latest", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - 
"attachment": true, - "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it:thinking", - "name": "Gemma 4 26B A4B Thinking", - "display_name": "Gemma 4 26B A4B Thinking", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -25898,27 +27325,41 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.13, - "output": 0.4 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemini-flash-1.5", - "name": "Gemini 1.5 Flash", - "display_name": "Gemini 1.5 Flash", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ "text" @@ -25928,31 +27369,33 @@ ] }, "limit": { - "context": 2000000, - "output": 8192 + "context": 131072, + "output": 16384 
}, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-05-14", - "last_updated": "2024-05-14", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.0748, - "output": 0.306 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -25960,74 +27403,91 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0.35 + "input": 2.4, + "output": 10, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "google/gemini-flash-lite-latest", - "name": "Gemini Flash Lite Latest", - "display_name": "Gemini Flash Lite Latest", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash (Preview)", - "display_name": "Gemini 3 Flash (Preview)", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26036,36 +27496,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.5, - "output": 3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" - }, + } + ] + }, + "fireworks-ai": { + "id": "fireworks-ai", + "name": "Fireworks AI", + "display_name": "Fireworks AI", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://fireworks.ai/docs/", + "models": [ { - "id": "google/gemini-3.1-pro-preview-high", - "name": "Gemini 3.1 Pro (Preview High)", - "display_name": "Gemini 3.1 Pro (Preview High)", + "id": "accounts/fireworks/routers/kimi-k2p6-turbo", + "name": "Kimi K2.6 Turbo", + 
"display_name": "Kimi K2.6 Turbo", "modalities": { "input": [ "text", @@ -26076,9 +27539,10 @@ ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 262000, + "output": 262000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26087,48 +27551,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-21", - "last_updated": "2026-02-21", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 8, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro (Preview Custom Tools)", - "display_name": "Gemini 3.1 Pro (Preview Custom Tools)", + "id": "accounts/fireworks/routers/glm-5p1-fast", + "name": "GLM 5.1 Fast", + "display_name": "GLM 5.1 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 202800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26137,35 +27595,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": 
"2026-04-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 2.8, + "output": 8.8, + "cache_read": 0.52 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it:thinking", - "name": "Gemma 4 31B Thinking", - "display_name": "Gemma 4 31B Thinking", + "id": "accounts/fireworks/routers/kimi-k2p6-fast", + "name": "Kimi K2.6 Fast", + "display_name": "Kimi K2.6 Fast", "modalities": { "input": [ "text", @@ -26176,75 +27628,102 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 262000, + "output": 262000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-06-05", "cost": { - "input": 0.1, - "output": 0.35 + "input": 2, + "output": 8, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "google/gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "accounts/fireworks/models/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 384000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15 + "input": 0.14, + "output": 0.28, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash-thinking", - "name": "Gemini 3.5 Flash Thinking", - "display_name": "Gemini 3.5 Flash Thinking", + "id": "accounts/fireworks/models/kimi-k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -26252,37 +27731,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro (Preview)", - "display_name": "Gemini 3.1 Pro (Preview)", + "id": "accounts/fireworks/models/qwen3p6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ "text", @@ -26293,9 +27765,43 @@ ] }, "limit": { - "context": 1048756, + "context": 262144, "output": 65536 }, + "temperature": true, + "tool_call": true, + "reasoning": { + 
"supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-04", + "last_updated": "2026-04-04", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.1 + }, + "type": "chat" + }, + { + "id": "accounts/fireworks/models/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 384000 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26304,49 +27810,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "accounts/fireworks/models/minimax-m2p7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 196608, + "output": 196608 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26354,24 +27854,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-12", + "last_updated": "2026-04-12", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B", - "display_name": "Gemma 4 26B A4B", + "id": "accounts/fireworks/models/kimi-k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -26382,42 +27888,54 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 262000, + "output": 262000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.13, - "output": 0.4 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "accounts/fireworks/models/glm-5p1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26426,101 +27944,80 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - 
"level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview-thinking", - "name": "Gemini 3 Flash Thinking", - "display_name": "Gemini 3 Flash Thinking", + "id": "accounts/fireworks/models/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.5, - "output": 3 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-low", - "name": "Gemini 3.1 Pro (Preview Low)", - "display_name": "Gemini 3.1 Pro (Preview Low)", + "id": "accounts/fireworks/models/minimax-m2p5", + "name": "MiniMax-M2.5", + "display_name": 
"MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 196608, + "output": 196608 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26529,35 +28026,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-21", - "last_updated": "2026-02-21", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", - "name": "Qwen 2.5 32B Abliterated", - "display_name": "Qwen 2.5 32B Abliterated", + "id": "accounts/fireworks/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -26567,27 +28058,44 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 131072, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-06", - "last_updated": "2025-01-06", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.07, + "output": 0.3, + "cache_read": 0.035 }, "type": "chat" - }, + } + ] + }, + "vultr": { + "id": "vultr", + "name": "Vultr", + "display_name": "Vultr", + "api": 
"https://api.vultrinference.com/v1", + "doc": "https://api.vultrinference.com/", + "models": [ { - "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", - "name": "Llama 3.3 70B Instruct abliterated", - "display_name": "Llama 3.3 70B Instruct abliterated", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text" @@ -26597,27 +28105,41 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", - "name": "DeepSeek R1 Llama 70B Abliterated", - "display_name": "DeepSeek R1 Llama 70B Abliterated", + "id": "nvidia/Llama-3.1-Nemotron-Safety-Guard-8B-v3", + "name": "Llama 3.1 Nemotron Safety Guard", + "display_name": "Llama 3.1 Nemotron Safety Guard", "modalities": { "input": [ "text" @@ -26627,28 +28149,29 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 8192, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", 
"cost": { - "input": 0.7, - "output": 0.7 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", - "name": "DeepSeek R1 Qwen Abliterated", - "display_name": "DeepSeek R1 Qwen Abliterated", + "id": "nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", + "name": "NVIDIA Nemotron 3 Nano Omni", + "display_name": "NVIDIA Nemotron 3 Nano Omni", "modalities": { "input": [ "text" @@ -26658,120 +28181,110 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 1.4, - "output": 1.4 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "nvidia/DeepSeek-V3.2-NVFP4", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2.499, - "output": 9.996 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT 5 Pro", - "display_name": "GPT 5 Pro", + "id": 
"nvidia/Nemotron-Cascade-2-30B-A3B", + "name": "NVIDIA Nemotron Cascade 2", + "display_name": "NVIDIA Nemotron Cascade 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 15, - "output": 120 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT 5 Mini", - "display_name": "GPT 5 Mini", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -26779,38 +28292,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": 
"2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.25, - "output": 2 + "input": 0.85, + "output": 3.1 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI o3-mini (High)", - "display_name": "OpenAI o3-mini (High)", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -26820,9 +28323,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -26831,55 +28335,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.64, - "output": 2.588 + "input": 0.3, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "302ai": { + "id": "302ai", + "name": "302.AI", + "display_name": "302.AI", + "api": "https://api.302.ai/v1", + "doc": "https://doc.302.ai", + "models": [ { - "id": "openai/o4-mini-high", - "name": "OpenAI o4-mini high", - "display_name": "OpenAI o4-mini high", + "id": "gpt-5.4-mini-2026-03-17", + "name": "gpt-5.4-mini-2026-03-17", + "display_name": "gpt-5.4-mini-2026-03-17", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - 
"default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -26887,20 +28407,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "chatgpt-4o-latest", + "name": "chatgpt-4o-latest", + "display_name": "chatgpt-4o-latest", "modalities": { "input": [ "text", @@ -26914,29 +28435,30 @@ "context": 128000, "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2023-09", + "release_date": "2024-08-08", + "last_updated": "2024-08-08", "cost": { - "input": 2.499, - "output": 9.996 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT 5.2", - "display_name": "GPT 5.2", + "id": "gpt-5.4-nano-2026-03-17", + "name": "gpt-5.4-nano-2026-03-17", + "display_name": "gpt-5.4-nano-2026-03-17", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -26946,6 +28468,7 @@ "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -26975,18 +28498,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", 
+ "last_updated": "2026-03-19", "cost": { - "input": 1.75, - "output": 14 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "kimi-k2-0905-preview", + "name": "kimi-k2-0905-preview", + "display_name": "kimi-k2-0905-preview", "modalities": { "input": [ "text" @@ -26996,94 +28520,66 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.632, + "output": 2.53 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": 
"hidden" + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { "input": 2, - "output": 8 + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "gemini-2.5-flash-nothink", + "name": "gemini-2.5-flash-nothink", + "display_name": "gemini-2.5-flash-nothink", "modalities": { "input": [ "text", @@ -27094,95 +28590,106 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "knowledge": "2025-01", + "release_date": "2025-06-24", + "last_updated": "2025-06-24", "cost": { - "input": 2.5, - "output": 10 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT 5", - "display_name": "GPT 5", + "id": "qwen-plus", + "name": "Qwen-Plus", + "display_name": "Qwen-Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": 
"effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-10", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10 + "input": 0.12, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT 5.4 Pro", - "display_name": "GPT 5.4 Pro", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 922000, - "output": 128000 + "context": 204800, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27191,69 +28698,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.286, + "output": 1.142 + }, + "type": "chat" + }, + { + "id": "qwen3-235b-a22b-instruct-2507", + "name": "qwen3-235b-a22b-instruct-2507", + "display_name": "qwen3-235b-a22b-instruct-2507", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + 
"output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 30, - "output": 180, - "cache_read": 3 + "input": 0.29, + "output": 1.143 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT 4.1 Mini", - "display_name": "GPT 4.1 Mini", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 64000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.29, + "output": 0.86 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 Pro", - "display_name": "GPT 5.2 Pro", + "id": "claude-opus-4-5", + "name": "claude-opus-4-5", + "display_name": "claude-opus-4-5", "modalities": { "input": [ "text", @@ -27265,90 +28799,124 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "high", "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": 
"medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 21, - "output": 168 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT-4o mini Search Preview", - "display_name": "GPT-4o mini Search Preview", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.088, - "output": 0.35 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI 
o4-mini", + "id": "gpt-5", + "name": "gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -27361,6 +28929,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -27368,20 +28943,21 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2024-09-30", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.1, - "output": 4.4 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT 5.4", - "display_name": "GPT 5.4", + "id": "claude-haiku-4-5-20251001", + "name": "claude-haiku-4-5-20251001", + "display_name": "claude-haiku-4-5-20251001", "modalities": { "input": [ "text", @@ -27393,9 +28969,10 @@ ] }, "limit": { - "context": 922000, - "output": 128000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27405,39 +28982,38 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "kimi-k2-thinking-turbo", + "name": "kimi-k2-thinking-turbo", + "display_name": "kimi-k2-thinking-turbo", "modalities": { "input": [ "text" @@ -27447,42 +29023,30 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1.1, - "output": 4.4 + "input": 1.265, + "output": 9.119 }, "type": "chat" }, { - "id": "openai/gpt-latest", - "name": "GPT Latest", - "display_name": "GPT Latest", + "id": "claude-3-5-haiku-20241022", + "name": "claude-3-5-haiku-20241022", + "display_name": "claude-3-5-haiku-20241022", "modalities": { "input": [ "text", @@ -27494,89 +29058,66 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-29", - "last_updated": "2026-03-29", + "knowledge": "2024-07-31", + 
"release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT 5.5", - "display_name": "GPT 5.5", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 98304 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT 5.1", - "display_name": "GPT 5.1", + "id": "gpt-5-pro", + "name": "gpt-5-pro", + "display_name": "gpt-5-pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -27584,25 +29125,20 @@ }, "limit": { "context": 400000, - "output": 128000 + "output": 272000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], + "default_enabled": true, + "mode": "fixed", + "effort": 
"high", "verbosity": "medium", "verbosity_options": [ "low", @@ -27614,18 +29150,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-09-30", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 1.25, - "output": 10 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT 5 Nano", - "display_name": "GPT 5 Nano", + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": "grok-4.20-beta-0309-reasoning", "modalities": { "input": [ "text", @@ -27636,61 +29173,48 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 2000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.05, - "output": 0.4 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -27698,27 +29222,44 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "gpt-4o", + "name": "gpt-4o", + "display_name": "gpt-4o", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -27728,78 +29269,62 @@ "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", 
- "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 2.5, - "output": 20 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT 5.1 Codex Mini", - "display_name": "GPT 5.1 Codex Mini", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "gemini-2.5-flash-lite-preview-09-2025", + "display_name": "gemini-2.5-flash-lite-preview-09-2025", "modalities": { "input": [ "text", @@ -27810,10 +29335,11 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": false @@ -27822,84 +29348,68 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 0.25, - "output": 2 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "OpenAI o1 Pro", - "display_name": "OpenAI o1 Pro", + "id": "doubao-seed-1-6-vision-250815", + "name": "doubao-seed-1-6-vision-250815", + "display_name": 
"doubao-seed-1-6-vision-250815", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 150, - "output": 600 + "input": 0.114, + "output": 1.143 }, "type": "chat" }, { - "id": "openai/gpt-chat-latest", - "name": "GPT Chat Latest", - "display_name": "GPT Chat Latest", + "id": "claude-opus-4-1-20250805", + "name": "claude-opus-4-1-20250805", + "display_name": "claude-opus-4-1-20250805", "modalities": { "input": [ "text", @@ -27911,33 +29421,51 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "openai/o3-pro-2025-06-10", - "name": "OpenAI o3-pro (2025-06-10)", - "display_name": "OpenAI o3-pro (2025-06-10)", + "id": "qwen3-max-2025-09-23", + "name": "qwen3-max-2025-09-23", + "display_name": "qwen3-max-2025-09-23", "modalities": { "input": [ "text" @@ -27947,42 +29475,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 258048, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "glm-4.7-flashx", + "name": "glm-4.7-flashx", + "display_name": "glm-4.7-flashx", "modalities": { "input": [ "text" @@ -27992,33 +29507,30 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + 
"open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-20", + "last_updated": "2026-01-20", "cost": { - "input": 0.04, - "output": 0.15 + "input": 0.0715, + "output": 0.429 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "GPT-4 Turbo Preview", - "display_name": "GPT-4 Turbo Preview", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ "text" @@ -28028,27 +29540,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "release_date": "2026-04-10", + "last_updated": "2026-04-10", "cost": { - "input": 9.996, - "output": 30.004999999999995 + "input": 0.86, + "output": 3.5 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI o3 Deep Research", - "display_name": "OpenAI o3 Deep Research", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -28058,42 +29583,35 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + 
"open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.286, + "output": 1.142 }, "type": "chat" }, { - "id": "openai/o3-mini-low", - "name": "OpenAI o3-mini (Low)", - "display_name": "OpenAI o3-mini (Low)", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -28103,9 +29621,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28114,31 +29633,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-06", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 9.996, - "output": 19.992 + "input": 0.575, + "output": 2.3 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "claude-sonnet-4-5", + "name": "claude-sonnet-4-5", + "display_name": "claude-sonnet-4-5", "modalities": { "input": [ "text", @@ -28150,83 +29667,116 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", - "cost": { - "input": 2, - "output": 8 + "supported": true, + "default": false }, - "type": "chat" + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT 5.4 Nano", - "display_name": "GPT 5.4 Nano", + "id": "glm-4.5-x", + "name": "glm-4.5-x", + "display_name": "glm-4.5-x", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", + "cost": { + "input": 1.143, + "output": 2.29 + }, + "type": "chat" + }, + { + "id": "deepseek-v3.2-thinking", + "name": "DeepSeek-V3.2-Thinking", + "display_name": "DeepSeek-V3.2-Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT 5.3 Codex", - "display_name": "GPT 5.3 Codex", + "id": "claude-sonnet-4-6-thinking", + "name": "claude-sonnet-4-6-thinking", + "display_name": "claude-sonnet-4-6-thinking", "modalities": { "input": [ "text", @@ -28238,9 +29788,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28250,126 +29801,174 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-08", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI o4-mini Deep Research", - "display_name": "OpenAI o4-mini Deep Research", + "id": "claude-opus-4-7", + "name": "claude-opus-4-7", + "display_name": "claude-opus-4-7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2026-01-31", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 9.996, - "output": 19.992 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "grok-4-1-fast-non-reasoning", + "name": "grok-4-1-fast-non-reasoning", + "display_name": "grok-4-1-fast-non-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 2000000, + "output": 30000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2022-11-30", - "last_updated": "2024-01-01", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1-2025-11-13", - "name": "GPT-5.1 (2025-11-13)", - "display_name": "GPT-5.1 (2025-11-13)", + "id": "gpt-5.4-nano", + "name": "gpt-5.4-nano", + "display_name": "gpt-5.4-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": false @@ -28384,7 +29983,8 @@ "none", "low", "medium", - 
"high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -28395,34 +29995,35 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 1.25, - "output": 10 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT 5.2 Codex", - "display_name": "GPT 5.2 Codex", + "id": "claude-opus-4-1-20250805-thinking", + "name": "claude-opus-4-1-20250805-thinking", + "display_name": "claude-opus-4-1-20250805-thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28432,166 +30033,157 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2025-03", + "release_date": "2025-05-27", + "last_updated": "2025-05-27", "cost": { - "input": 1.75, - "output": 14 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT 5.1 Codex", - "display_name": "GPT 5.1 Codex", + "id": "glm-4.5-airx", + "name": "glm-4.5-airx", + "display_name": "glm-4.5-airx", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 1.25, - "output": 10 + "input": 0.572, + "output": 1.714 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "grok-4.1", + "name": "grok-4.1", + "display_name": "grok-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": 
true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-06", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 2, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "gemini-2.5-flash-preview-09-2025", + "display_name": "gemini-2.5-flash-preview-09-2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "knowledge": "2025-01", + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT 5.4 Mini", - "display_name": "GPT 5.4 Mini", + "id": "claude-opus-4-5-20251101", + "name": "claude-opus-4-5-20251101", + "display_name": "claude-opus-4-5-20251101", "modalities": { "input": [ "text", @@ -28603,9 +30195,10 @@ ] }, "limit": { - "context": 
400000, - "output": 128000 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -28615,82 +30208,114 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-03-31", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "claude-opus-4-20250514", + "name": "claude-opus-4-20250514", + "display_name": "claude-opus-4-20250514", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ 
+ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2024-01-01", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 10, - "output": 30 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "gemini-3-pro-image-preview", + "name": "gemini-3-pro-image-preview", + "display_name": "gemini-3-pro-image-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 64000 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, @@ -28700,30 +30325,34 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-17", - "last_updated": "2024-12-17", + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 14.993999999999998, - "output": 59.993 + "input": 2, + "output": 120 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "gemini-2.5-flash-image", + "name": "gemini-2.5-flash-image", + "display_name": "gemini-2.5-flash-image", "modalities": { "input": [ "text", @@ -28734,89 
+30363,117 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2025-01", + "release_date": "2025-10-08", + "last_updated": "2025-10-08", "cost": { - "input": 1.47, - "output": 5.88 + "input": 0.3, + "output": 30 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT 4.1 Nano", - "display_name": "GPT 4.1 Nano", + "id": "glm-for-coding", + "name": "glm-for-coding", + "display_name": "glm-for-coding", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.086, + "output": 0.343 }, "type": "chat" }, { - "id": "poolside/laguna-m.1", - "name": "Laguna M.1", - "display_name": "Laguna M.1", + "id": "gpt-5.2", + "name": "gpt-5.2", + "display_name": "gpt-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + 
"medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.1, - "output": 0.3 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "poolside/laguna-xs.2", - "name": "Laguna XS.2", - "display_name": "Laguna XS.2", + "id": "qwen-flash", + "name": "Qwen-Flash", + "display_name": "Qwen-Flash", "modalities": { "input": [ "text" @@ -28826,147 +30483,226 @@ ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.022, + "output": 0.22 }, "type": "chat" }, { - "id": "baseten/Kimi-K2-Instruct-FP4", - "name": "Kimi K2 0711 Instruct FP4", - "display_name": "Kimi K2 0711 Instruct FP4", + "id": "claude-opus-4-6-thinking", + "name": "claude-opus-4-6-thinking", + "display_name": "claude-opus-4-6-thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "knowledge": "2025-05", + "release_date": "2026-02-06", + "last_updated": "2026-03-13", "cost": { - "input": 0.1, - "output": 2 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", - "name": "Llama 3 70B abliterated", - "display_name": "Llama 3 70B abliterated", + "id": "claude-sonnet-4-20250514", + "name": "claude-sonnet-4-20250514", + "display_name": "claude-sonnet-4-20250514", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.7, - "output": 0.7 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "NeverSleep/Lumimaid-v0.2-70B", - "name": "Lumimaid v0.2", - "display_name": "Lumimaid v0.2", + "id": "gpt-5.1-chat-latest", + "name": "gpt-5.1-chat-latest", + "display_name": "gpt-5.1-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1, - "output": 1.5 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "inflatebot/MN-12B-Mag-Mell-R1", - "name": "Mag Mell R1", - "display_name": "Mag Mell R1", + "id": "gpt-5.2-chat-latest", + "name": "gpt-5.2-chat-latest", + "display_name": "gpt-5.2-chat-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.49299999999999994, - "output": 0.49299999999999994 + "input": 1.75, + 
"output": 14 }, "type": "chat" }, { - "id": "minimax/minimax-m3", - "name": "MiniMax M3", - "display_name": "MiniMax M3", + "id": "grok-4-fast-reasoning", + "name": "grok-4-fast-reasoning", + "display_name": "grok-4-fast-reasoning", "modalities": { "input": [ "text", @@ -28977,12 +30713,14 @@ ] }, "limit": { - "context": 512000, - "output": 80000 + "context": 2000000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -28991,53 +30729,57 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax 01", - "display_name": "MiniMax 01", + "id": "gpt-4.1-nano", + "name": "gpt-4.1-nano", + "display_name": "gpt-4.1-nano", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 16384 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1394, - "output": 1.1219999999999999 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "claude-sonnet-4-5-20250929-thinking", + "display_name": "claude-sonnet-4-5-20250929-thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -29045,8 
+30787,9 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -29054,23 +30797,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "knowledge": "2025-03", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.33, - "output": 1.32 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7-turbo", - "name": "MiniMax M2.7 Turbo", - "display_name": "MiniMax M2.7 Turbo", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -29083,41 +30843,10 @@ "context": 204800, "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.6, - "output": 2.4 - }, - "type": "chat" - }, - { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ 
-29132,87 +30861,94 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + "output": 4.8 }, "type": "chat" }, { - "id": "minimax/minimax-m3:thinking", - "name": "MiniMax M3 Thinking", - "display_name": "MiniMax M3 Thinking", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 80000 + "context": 1000000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "release_date": "2025-10-26", + "last_updated": "2025-10-26", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "gemini-3.1-flash-image-preview", + "name": "gemini-3.1-flash-image-preview", + "display_name": "gemini-3.1-flash-image-preview", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 32768 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-01", + "release_date": 
"2026-02-27", + "last_updated": "2026-02-27", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.5, + "output": 60 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax M2-her", - "display_name": "MiniMax M2-her", + "id": "qwen3-235b-a22b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -29222,27 +30958,40 @@ ] }, "limit": { - "context": 65532, - "output": 2048 + "context": 128000, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-24", - "last_updated": "2026-01-24", + "knowledge": "2025-04", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.30200000000000005, - "output": 1.2069999999999999 + "input": 0.29, + "output": 2.86 }, "type": "chat" }, { - "id": "minimax/minimax-latest", - "name": "MiniMax Latest", - "display_name": "MiniMax Latest", + "id": "ministral-14b-2512", + "name": "ministral-14b-2512", + "display_name": "ministral-14b-2512", "modalities": { "input": [ "text", @@ -29253,32 +31002,34 @@ ] }, "limit": { - "context": 512000, - "output": 80000 + "context": 128000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-03", - "last_updated": "2026-05-03", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - 
"name": "Olmo 3 32B Think", - "display_name": "Olmo 3 32B Think", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -29286,283 +31037,376 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.3, - "output": 0.44999999999999996 + "input": 0.145, + "output": 0.43 }, "type": "chat" - } - ] - }, - "alibaba-cn": { - "id": "alibaba-cn", - "name": "alibaba-cn", - "display_name": "alibaba-cn", - "api": "https://dashscope.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "claude-haiku-4-5", + "name": "claude-haiku-4-5", + "display_name": "claude-haiku-4-5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this 
model family." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ - "audio" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 1050000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.032, - "output": 0.032 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "cache_write": 0, + "tiers": [ + { + "input": 5, + "output": 22.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5 + } }, "type": "chat" }, { - "id": "qwen-math-turbo", - "name": "Qwen Math Turbo", - "display_name": "Qwen Math Turbo", + "id": "doubao-seed-1-6-thinking-250715", + "name": "doubao-seed-1-6-thinking-250715", + "display_name": "doubao-seed-1-6-thinking-250715", "modalities": 
{ "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 256000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.121, + "output": 1.21 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "gpt-5.4-mini", + "name": "gpt-5.4-mini", + "display_name": "gpt-5.4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "knowledge": "2025-08-31", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "qwen2-5-math-72b-instruct", - "name": "Qwen2.5-Math 72B Instruct", - "display_name": "Qwen2.5-Math 72B Instruct", + "id": 
"gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.574, - "output": 1.721 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "doubao-seed-code-preview-251028", + "name": "doubao-seed-code-preview-251028", + "display_name": "doubao-seed-code-preview-251028", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-11", + "last_updated": "2025-11-11", "cost": { - "input": 0.144, - "output": 0.574 + "input": 0.17, + "output": 1.14 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "claude-opus-4-6", + "name": "claude-opus-4-6", + "display_name": "claude-opus-4-6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-06", + "last_updated": "2026-03-13", "cost": { - "input": 2.294, - "output": 6.881 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "qwen-deep-research", - "name": "Qwen Deep Research", - "display_name": "Qwen Deep Research", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "qwen3-coder-480b-a35b-instruct", + "display_name": "qwen3-coder-480b-a35b-instruct", "modalities": { "input": [ "text" @@ -29572,8 +31416,8 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -29582,101 +31426,75 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 7.742, - "output": 23.367 + "input": 0.86, + "output": 3.43 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "claude-sonnet-4-5-20250929", + "name": "claude-sonnet-4-5-20250929", + "display_name": 
"claude-sonnet-4-5-20250929", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", - "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 - }, - "type": "chat" - }, - { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.216, - "output": 0.861 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Moonshot Kimi K2 Thinking", - "display_name": "Moonshot Kimi K2 Thinking", + "id": "deepseek-reasoner", + "name": "Deepseek-Reasoner", + 
"display_name": "Deepseek-Reasoner", "modalities": { "input": [ "text" @@ -29686,8 +31504,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -29707,54 +31525,63 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.574, - "output": 2.294 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "qwen2-5-math-7b-instruct", - "name": "Qwen2.5-Math 7B Instruct", - "display_name": "Qwen2.5-Math 7B Instruct", + "id": "grok-4-1-fast-reasoning", + "name": "grok-4-1-fast-reasoning", + "display_name": "grok-4-1-fast-reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.144, - "output": 0.287 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "gemini-3-pro-preview", + "name": "gemini-3-pro-preview", + "display_name": "gemini-3-pro-preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -29762,64 +31589,58 @@ }, "limit": { "context": 1000000, - "output": 32768 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-06", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.022, - "output": 0.216 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "gpt-5-thinking", + "name": "gpt-5-thinking", + "display_name": "gpt-5-thinking", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -29827,131 +31648,131 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2024-10", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0.573, - "output": 3.44, - "reasoning": 3.44 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-8b", - "name": "DeepSeek R1 Distill Llama 8B", - "display_name": 
"DeepSeek R1 Distill Llama 8B", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + 
"last_updated": "2025-04-14", "cost": { - "input": 0.287, - "output": 1.147, - "reasoning": 2.868 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -29964,36 +31785,34 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.861, - "output": 3.441 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Moonshot Kimi K2.6", - "display_name": "Moonshot Kimi K2.6", + "id": "gpt-5.4-pro", + "name": "gpt-5.4-pro", + "display_name": "gpt-5.4-pro", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -30002,29 +31821,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": 
"2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.929, - "output": 3.858 + "input": 30, + "output": 180, + "cache_read": 0, + "cache_write": 0, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "glm-4.5-air", + "name": "glm-4.5-air", + "display_name": "glm-4.5-air", "modalities": { "input": [ "text" @@ -30035,128 +31879,125 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.1143, + "output": 0.286 }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "claude-sonnet-4-6", + "name": "claude-sonnet-4-6", + "display_name": "claude-sonnet-4-6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + 
"effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-18", + "last_updated": "2026-03-13", "cost": { - "input": 0.144, - "output": 0.574, - "reasoning": 1.434 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "grok-4-fast-non-reasoning", + "name": "grok-4-fast-non-reasoning", + "display_name": "grok-4-fast-non-reasoning", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-06", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 
235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "gemini-3-flash-preview", + "name": "gemini-3-flash-preview", + "display_name": "gemini-3-flash-preview", "modalities": { "input": [ "text", @@ -30167,8 +32008,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -30179,30 +32020,37 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.286705, - "output": 1.14682, - "reasoning": 2.867051 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "deepseek-chat", + "name": "Deepseek-Chat", + "display_name": "Deepseek-Chat", "modalities": { "input": [ "text" @@ -30212,45 +32060,32 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2024-07", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 0.574, - "output": 2.294 + "input": 
0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "qwen3.5-flash", - "name": "Qwen3.5 Flash", - "display_name": "Qwen3.5 Flash", + "id": "MiniMax-M1", + "name": "MiniMax-M1", + "display_name": "MiniMax-M1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -30258,72 +32093,65 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.172, - "output": 1.72, - "reasoning": 1.72 + "input": 0.132, + "output": 1.254 }, "type": "chat" }, { - "id": "deepseek-v3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "grok-4.20-multi-agent-beta-0309", + "name": "grok-4.20-multi-agent-beta-0309", + "display_name": "grok-4.20-multi-agent-beta-0309", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.574, - "output": 1.721 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": 
"Qwen3 8B", + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", "modalities": { "input": [ "text" @@ -30333,19 +32161,14 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -30360,20 +32183,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.072, - "output": 0.287, - "reasoning": 0.717 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "qwen-max-latest", + "name": "Qwen-Max-Latest", + "display_name": "Qwen-Max-Latest", "modalities": { "input": [ "text" @@ -30383,36 +32204,29 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "knowledge": "2024-11", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 0.343, + "output": 1.372 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "mistral-large-2512", + "name": "mistral-large-2512", + "display_name": "mistral-large-2512", "modalities": { "input": [ "text", @@ -30423,29 +32237,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 262144 
}, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 0.115, - "output": 0.287 + "input": 1.1, + "output": 3.3 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -30455,123 +32269,89 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "claude-3-5-haiku-latest", + "name": "claude-3-5-haiku-latest", + "display_name": "claude-3-5-haiku-latest", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - 
"visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "qwen3-30b-a3b", + "name": "Qwen3-30B-A3B", + "display_name": "Qwen3-30B-A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": true }, "extra_capabilities": { "reasoning": { @@ -30587,19 +32367,18 @@ "attachment": false, "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.143353, - "output": 1.433525, - "reasoning": 4.300576 + "input": 0.11, + "output": 1.08 }, "type": "chat" }, { - "id": "tongyi-intent-detect-v3", - "name": "Tongyi Intent Detect V3", - "display_name": "Tongyi Intent Detect V3", + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", "modalities": { "input": [ "text" @@ -30609,137 +32388,160 @@ ] }, "limit": { - "context": 8192, - 
"output": 1024 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2024-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.058, - "output": 0.144 + "input": 0.29, + "output": 0.43 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "doubao-seed-1-8-251215", + "name": "doubao-seed-1-8-251215", + "display_name": "doubao-seed-1-8-251215", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 224000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 0.345, - "output": 1.377 + "input": 0.114, + "output": 0.286 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "claude-opus-4-5-20251101-thinking", + "name": "claude-opus-4-5-20251101-thinking", + "display_name": "claude-opus-4-5-20251101-thinking", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "knowledge": "2025-03", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.058, - "output": 0.23, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "gemini-2.0-flash-lite", + "name": "gemini-2.0-flash-lite", + "display_name": "gemini-2.0-flash-lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.861, - "output": 3.441 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - 
"display_name": "Qwen3 Next 80B A3B Thinking", + "id": "glm-5-turbo", + "name": "glm-5-turbo", + "display_name": "glm-5-turbo", "modalities": { "input": [ "text" @@ -30749,19 +32551,14 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -30775,52 +32572,83 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.144, - "output": 1.434 + "input": 0.72, + "output": 3.2 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gpt-5.1", + "name": "gpt-5.1", + "display_name": "gpt-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.144, - "output": 0.574 + "input": 
1.25, + "output": 10 }, "type": "chat" - }, + } + ] + }, + "zhipuai": { + "id": "zhipuai", + "name": "Zhipu AI", + "display_name": "Zhipu AI", + "api": "https://open.bigmodel.cn/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", + "models": [ { - "id": "moonshot-kimi-k2-instruct", - "name": "Moonshot Kimi K2 Instruct", - "display_name": "Moonshot Kimi K2 Instruct", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -30830,41 +32658,56 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.574, - "output": 2.294 + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", "image", - "video" + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -30885,19 +32728,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-04-27", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.1875, - "output": 1.125, - "cache_write": 0.234375 + "input": 5, + "output": 22, + "cache_read": 1.2, + 
"cache_write": 0 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -30907,19 +32751,14 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -30932,28 +32771,22 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-07-15", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.044, - "output": 0.087, - "reasoning": 0.431 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -30964,63 +32797,42 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - 
"last_updated": "2025-03-05", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.23, - "output": 0.574 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -31030,31 +32842,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.108, - "output": 0.431, - "reasoning": 1.076 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen-plus-character", - "name": "Qwen Plus Character", - "display_name": "Qwen Plus Character", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -31064,40 +32871,45 @@ ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.115, - "output": 
0.287 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-1-5b", - "name": "DeepSeek R1 Distill Qwen 1.5B", - "display_name": "DeepSeek R1 Distill Qwen 1.5B", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -31105,20 +32917,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "qwq-32b", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -31128,8 +32941,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -31139,30 +32952,26 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + 
"id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -31172,8 +32981,8 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -31182,19 +32991,22 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.144, - "output": 0.431 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -31204,8 +33016,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -31213,66 +33025,58 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 34096, - "output": 4096 + 
"context": 64000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.717, - "output": 0.717 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -31282,8 +33086,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -31303,19 +33107,31 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.86, - "output": 3.15 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "cortecs": { + "id": "cortecs", + "name": "Cortecs", + "display_name": "Cortecs", + "api": "https://api.cortecs.ai/v1", + "doc": "https://api.cortecs.ai/v1/models", + "models": [ { - "id": "qwen-math-plus", - "name": "Qwen Math Plus", - "display_name": "Qwen Math Plus", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -31325,66 +33141,86 @@ ] }, "limit": { - "context": 4096, - "output": 3072 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-08-16", - "last_updated": "2024-09-19", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.574, - "output": 1.721 + "input": 0.585, + "output": 2.307 }, "type": "chat" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.087, - "output": 0.345, - "input_audio": 5.448 + "input": 0.133, + "output": 0.266, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -31394,60 +33230,40 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - 
"open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", - "cost": { - "input": 0.287, - "output": 1.147 - }, - "type": "chat" - }, - { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 8192 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.101, - "output": 0.28 + "input": 0.32, + "output": 1.18 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "deepseek-v3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -31457,8 +33273,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -31467,51 +33283,56 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.551, + "output": 1.654 }, "type": "chat" }, { - "id": "qwen2-5-coder-7b-instruct", - "name": "Qwen2.5-Coder 7B Instruct", - "display_name": "Qwen2.5-Coder 7B Instruct", + "id": "claude-opus4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { 
"input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.144, - "output": 0.287 + "input": 5.6, + "output": 27.99, + "cache_read": 0.56, + "cache_write": 6.99 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -31521,8 +33342,8 @@ ] }, "limit": { - "context": 245800, - "output": 65536 + "context": 198000, + "output": 198000 }, "temperature": true, "tool_call": true, @@ -31542,53 +33363,53 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.32, - "output": 7.9, - "cache_read": 0.132 + "input": 0.45, + "output": 2.23 }, "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, 
"attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.23, - "output": 0.574 + "input": 0.062, + "output": 0.408 }, "type": "chat" }, { - "id": "qwen2-5-coder-32b-instruct", - "name": "Qwen2.5-Coder 32B Instruct", - "display_name": "Qwen2.5-Coder 32B Instruct", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -31598,42 +33419,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-11", - "last_updated": "2024-11", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.287, - "output": 0.861 + "input": 0.053, + "output": 0.222 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 196000, + "output": 196000 }, "temperature": true, "tool_call": true, @@ -31654,20 +33474,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.43, - "output": 2.58, - "reasoning": 2.58 + "input": 0.34, + "output": 1.34 }, "type": "chat" }, { - "id": 
"deepseek-r1-distill-qwen-7b", - "name": "DeepSeek R1 Distill Qwen 7B", - "display_name": "DeepSeek R1 Distill Qwen 7B", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -31677,98 +33495,131 @@ ] }, "limit": { - "context": 32768, + "context": 16384, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.072, - "output": 0.144 + "input": 0.099, + "output": 0.33 }, "type": "chat" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "claude-4-6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 1000000, + "output": 1000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 3.59, + "output": 17.92 }, "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": 
"Qwen2.5 14B Instruct", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.144, - "output": 0.431 + "input": 3.307, + "output": 16.536 }, "type": "chat" }, { - "id": "qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", @@ -31779,8 +33630,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -31790,69 +33641,73 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, 
"attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-06-02", - "last_updated": "2026-06-02", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-17", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 128000 - } - } - ] + "input": 1.654, + "output": 11.024 }, "type": "chat" }, { - "id": "deepseek-v3-2-exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "claude-4-5-sonnet", + "name": "Claude 4.5 Sonnet", + "display_name": "Claude 4.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.287, - "output": 0.431 + "input": 3.259, + "output": 16.296 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "mixtral-8x7B-instruct-v0.1", + "name": "Mixtral 8x7B Instruct v0.1", + "display_name": "Mixtral 8x7B Instruct v0.1", "modalities": { "input": [ "text" @@ -31862,55 +33717,41 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2023-09", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.438, + "output": 0.68 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Moonshot Kimi K2.5", - "display_name": "Moonshot Kimi K2.5", + "id": "glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -31931,56 +33772,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", - "cost": { - "input": 0.574, - "output": 2.411 - }, - "type": "chat" - }, - { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", - "modalities": { - "input": [ - "text", - "image", - "audio" - ], - "output": [ - "text", - "audio" - ] - }, - "limit": { - "context": 32768, - "output": 2048 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "knowledge": "2025-04", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.23, - "output": 0.918, - "input_audio": 3.584, - "output_audio": 7.168 + "input": 0.67, + "output": 2.46 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" 
@@ -31990,29 +33794,29 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-07-11", + "last_updated": "2025-09-05", "cost": { - "input": 0.259, - "output": 0.775 + "input": 0.551, + "output": 2.646 }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "llama-3.3-70b-instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -32022,41 +33826,8 @@ ] }, "limit": { - "context": 1000000, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-25", - "last_updated": "2025-01-25", - "cost": { - "input": 0.072, - "output": 0.287 - }, - "type": "chat" - }, - { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -32065,63 +33836,68 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.147, - "output": 4.588 + "input": 0.089, + "output": 0.275 }, "type": "chat" }, { - "id": "deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill 
Qwen 32B", + "id": "claude-opus4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.287, - "output": 0.861 + "input": 5.64, + "output": 28.198, + "cache_read": 0.563, + "cache_write": 7.049 }, "type": "chat" }, { - "id": "qwen-doc-turbo", - "name": "Qwen Doc Turbo", - "display_name": "Qwen Doc Turbo", + "id": "devstral-small-2512", + "name": "Devstral Small 2 2512", + "display_name": "Devstral Small 2 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -32129,13 +33905,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.087, - "output": 0.144 + "input": 0, + "output": 0 }, "type": "chat" }, @@ -32152,8 +33928,8 @@ ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -32177,49 +33953,61 @@ "release_date": "2026-04-14", "last_updated": "2026-04-14", "cost": { - "input": 0.87, - "output": 3.48, - "cache_read": 0.17 + "input": 1.31, + "output": 4.1, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": 
"Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.287, - "output": 0.717 + "input": 1.553, + "output": 3.106, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -32229,19 +34017,14 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -32254,28 +34037,21 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-11", "last_updated": "2025-09-11", "cost": { - "input": 0.115, - "output": 0.287, - 
"reasoning": 1.147 + "input": 0.164, + "output": 1.311 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -32285,29 +34061,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2025-12", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.072, - "output": 0.144 + "input": 0.656, + "output": 2.731 }, "type": "chat" }, { - "id": "MiniMax/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -32317,8 +34105,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 400000 }, "temperature": true, "tool_call": true, @@ -32339,20 +34127,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-11", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.39, + "output": 1.57 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "minimax-m2.7", + "name": "MiniMax-m2.7", + "display_name": 
"MiniMax-m2.7", "modalities": { "input": [ "text" @@ -32362,40 +34149,53 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 202752, + "output": 196072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1, - "output": 5 + "input": 0.47, + "output": 1.4 }, "type": "chat" }, { - "id": "siliconflow/deepseek-r1-0528", - "name": "siliconflow/deepseek-r1-0528", - "display_name": "siliconflow/deepseek-r1-0528", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -32415,19 +34215,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.55, + "output": 2.76 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3-0324", - "name": "siliconflow/deepseek-v3-0324", - "display_name": "siliconflow/deepseek-v3-0324", + "id": "gpt-oss-120b", + "name": "GPT Oss 120b", + "display_name": "GPT Oss 120b", "modalities": { "input": [ "text" @@ -32437,28 +34238,34 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.25, - "output": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.2", - "name": "siliconflow/deepseek-v3.2", - "display_name": "siliconflow/deepseek-v3.2", + "id": "qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -32468,34 +34275,29 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.062, + "output": 0.231 }, "type": "chat" }, { - "id": "siliconflow/deepseek-v3.1-terminus", - "name": "siliconflow/deepseek-v3.1-terminus", - "display_name": "siliconflow/deepseek-v3.1-terminus", + "id": "hermes-4-70b", + "name": "Hermes 4 70B", + "display_name": "Hermes 4 70B", "modalities": { "input": [ "text" @@ -32505,8 +34307,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -32515,114 +34317,134 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2023-12", + "release_date": 
"2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.27, - "output": 1 + "input": 0.116, + "output": 0.358 }, "type": "chat" }, { - "id": "kimi/kimi-k2.5", - "name": "kimi/kimi-k2.5", - "display_name": "kimi/kimi-k2.5", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 200000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 1.09, + "output": 5.43 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 3, + "output": 16.13, + "cache_read": 0.25 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl 
Ocr Latest", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -32633,21 +34455,41 @@ ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", + "cost": { + "input": 0.81, + "output": 3.54, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ "text", @@ -32658,74 +34500,62 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 - } + "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2.354, + "output": 9.417 + }, "type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "nova-pro-v1", + "name": "Nova Pro 1.0", + "display_name": "Nova Pro 1.0", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 300000, + "output": 5000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - 
"default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", + "cost": { + "input": 1.016, + "output": 4.061 + }, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next 80B", + "display_name": "Qwen3 Coder Next 80B", "modalities": { "input": [ "text" @@ -32735,68 +34565,65 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-04", + "last_updated": "2026-02-04", + "cost": { + "input": 0.158, + "output": 0.84 + }, "type": "chat" }, { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", + "id": "claude-opus4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] - } + "default": true }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5.98, + "output": 29.89 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -32806,44 +34633,29 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "cost": { + "input": 0.441, + "output": 1.984 + }, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "devstral-2512", + "name": "Devstral 2 2512", + "display_name": "Devstral 2 2512", "modalities": { "input": [ "text" @@ -32853,8 +34665,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -32862,12 +34674,20 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + 
"release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text" @@ -32877,19 +34697,14 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 250000, + "output": 250000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -32902,19 +34717,54 @@ ] } }, - "search": { + "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0.6, + "output": 3.6 + }, + "type": "chat" + }, + { + "id": "glm-4.5-air", + "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", + "cost": { + "input": 0.22, + "output": 1.34 + }, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -32924,19 +34774,14 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 203000, + "output": 203000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -32949,19 +34794,21 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", + "cost": { + "input": 0.09, + "output": 0.53 + }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "intellect-3", + "name": "INTELLECT 3", + "display_name": "INTELLECT 3", "modalities": { "input": [ "text" @@ -32971,27 +34818,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2025-11-26", + "last_updated": "2025-11-26", + "cost": { + "input": 0.219, + "output": 1.202 }, - "attachment": false, "type": "chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "llama-3.1-405b-instruct", + "name": "Llama 3.1 405B Instruct", + "display_name": "Llama 3.1 405B Instruct", "modalities": { "input": [ "text" @@ -33001,27 +34851,29 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 
0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -33031,45 +34883,74 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1.08, + "output": 3.44 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "mistral-large-2512", + "name": "Mistral Large 3 2512", + "display_name": "Mistral Large 3 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0.05 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -33079,27 +34960,35 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - 
"search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.266, + "output": 0.444 + }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", "modalities": { "input": [ "text" @@ -33109,27 +34998,30 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0.3, + "output": 0.9, + "cache_read": 0.03 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ "text" @@ -33140,12 +35032,13 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -33158,19 +35051,21 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 0.444, + "output": 3.106 + }, 
"type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B A12B", + "display_name": "Nemotron 3 Super 120B A12B", "modalities": { "input": [ "text" @@ -33180,38 +35075,74 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", + "cost": { + "input": 0.266, + "output": 0.799 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "claude-opus4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5.98, + "output": 29.89 + }, + "type": "chat" + } + ] + }, + "nebius": { + "id": "nebius", + "name": "Nebius Token Factory", + "display_name": "Nebius Token Factory", + "api": "https://api.tokenfactory.nebius.com/v1", + "doc": "https://docs.tokenfactory.nebius.com/", + "models": [ + { + "id": 
"meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -33221,8 +35152,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33230,12 +35161,22 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-12-05", + "last_updated": "2026-02-04", + "cost": { + "input": 0.13, + "output": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -33245,8 +35186,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -33254,34 +35195,40 @@ "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2024-07-23", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "moonshotai/Kimi-K2.5-fast", + "name": "Kimi-K2.5-fast", + "display_name": "Kimi-K2.5-fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": 
{ "reasoning": { @@ -33294,35 +35241,41 @@ ] } }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.5, + "output": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -33335,13 +35288,24 @@ ] } }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-12-15", + "last_updated": "2026-02-04", + "cost": { + "input": 0.5, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.05, + "cache_write": 0.625 + }, "type": "chat" }, { - "id": "qwen3-4b", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "google/gemma-2-2b-it", + "name": "Gemma-2-2b-it", + "display_name": "Gemma-2-2b-it", "modalities": { "input": [ "text" @@ -33351,79 +35315,66 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": 
"2024-06", + "release_date": "2024-07-31", + "last_updated": "2026-02-04", + "cost": { + "input": 0.02, + "output": 0.06, + "cache_read": 0.002, + "cache_write": 0.025 + }, "type": "chat" }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "google/gemma-3-27b-it", + "name": "Gemma-3-27b-it", + "display_name": "Gemma-3-27b-it", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 110000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", + "name": "Qwen3-Next-80B-A3B-Thinking-fast", + "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", "modalities": { "input": [ "text" @@ -33433,19 +35384,14 @@ ] }, "limit": { - "context": 32768, + "context": 8000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -33459,12 +35405,22 @@ } }, "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", + "cost": { + "input": 0.15, + "output": 1.2, + "cache_read": 0.015, + "cache_write": 0.1875 + 
}, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", @@ -33475,19 +35431,80 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2026-02-04", + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025, + "cache_write": 0.31 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3-Embedding-8B", + "display_name": "Qwen3-Embedding-8B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 + }, + "temperature": false, "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-10", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", + "cost": { + "input": 0.01, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -33501,12 +35518,22 @@ } }, "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", + "cost": { + "input": 0.6, + "output": 3.6, + "cache_read": 
0.06, + "cache_write": 0.75 + }, "type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "Qwen/Qwen3.5-397B-A17B-fast", + "name": "Qwen3.5-397B-A17B-fast", + "display_name": "Qwen3.5-397B-A17B-fast", "modalities": { "input": [ "text" @@ -33516,19 +35543,14 @@ ] }, "limit": { - "context": 131072, + "context": 8000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -33541,60 +35563,57 @@ ] } }, - "search": { - "supported": false - }, "attachment": false, + "open_weights": true, + "knowledge": "2025-07", + "release_date": "2025-07-15", + "last_updated": "2026-05-07", + "cost": { + "input": 0.6, + "output": 3.6, + "cache_read": 0.06, + "cache_write": 0.75 + }, "type": "chat" - } - ] - }, - "digitalocean": { - "id": "digitalocean", - "name": "DigitalOcean", - "display_name": "DigitalOcean", - "api": "https://inference.do-ai.run/v1", - "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", - "models": [ + }, { - "id": "openai-gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": 
"2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "deepseek-3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -33605,7 +35624,7 @@ }, "limit": { "context": 128000, - "output": 64000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -33626,82 +35645,100 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2026-04-30", + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 0.5, - "output": 1.6 + "input": 0.15, + "output": 1.2, + "reasoning": 1.2, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "openai-gpt-image-2", - "name": "GPT Image 2", - "display_name": "GPT Image 2", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 262144, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-10-04", + "cost": { + "input": 0.2, + "output": 0.6 + }, "type": "chat" }, { - "id": "openai-gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3-32B", + 
"display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-28", + "last_updated": "2026-02-04", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-super-120b", - "name": "Nemotron-3-Super-120B", - "display_name": "Nemotron-3-Super-120B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", + "name": "Qwen3-235B-A22B-Thinking-2507-fast", + "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", "modalities": { "input": [ "text" @@ -33711,8 +35748,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33720,66 +35757,80 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-04-16", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2026-05-07", "cost": { - "input": 0.3, - "output": 0.65 + "input": 0.5, + "output": 2, + "cache_read": 0.05, + "cache_write": 0.625 }, 
"type": "chat" }, { - "id": "wan2-2-t2v-a14b", - "name": "Wan2.2-T2V-A14B", - "display_name": "Wan2.2-T2V-A14B", + "id": "openai/gpt-oss-120b-fast", + "name": "gpt-oss-120b-fast", + "display_name": "gpt-oss-120b-fast", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 100, - "output": 1 + "context": 8000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "knowledge": "2025-06", + "release_date": "2025-06-10", + "last_updated": "2026-05-07", "cost": { - "input": 0.6, - "output": 0 + "input": 0.1, + "output": 0.5, + "cache_read": 0.01, + "cache_write": 0.125 }, "type": "chat" }, { - "id": "nemotron-3-nano-omni", - "name": "Nemotron Nano 3 Omni", - "display_name": "Nemotron Nano 3 Omni", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33787,67 +35838,93 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "knowledge": "2025-09", + "release_date": "2026-01-10", + "last_updated": "2026-02-04", "cost": { - "input": 0.5, - "output": 0.9 + "input": 0.15, + "output": 0.6, + "reasoning": 0.6, + "cache_read": 0.015, + "cache_write": 0.18 }, "type": "chat" }, { - "id": "openai-gpt-5.4-pro", - "name": "GPT-5.4 
pro", - "display_name": "GPT-5.4 pro", + "id": "NousResearch/Hermes-4-405B", + "name": "Hermes-4-405B", + "display_name": "Hermes-4-405B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": "2026-02-04", "cost": { - "input": 30, - "output": 180 + "input": 1, + "output": 3, + "reasoning": 3, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "anthropic-claude-4.1-opus", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "NousResearch/Hermes-4-70B", + "name": "Hermes-4-70B", + "display_name": "Hermes-4-70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -33855,140 +35932,149 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-30", + "last_updated": 
"2026-02-04", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.13, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.013, + "cache_write": 0.16 }, "type": "chat" }, { - "id": "llama-4-maverick", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", + "name": "Nemotron-3-Nano-30B-A3B", + "display_name": "Nemotron-3-Nano-30B-A3B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2026-04-30", + "knowledge": "2025-05", + "release_date": "2025-08-10", + "last_updated": "2026-02-04", "cost": { - "input": 0.25, - "output": 0.87 + "input": 0.06, + "output": 0.24, + "cache_read": 0.006, + "cache_write": 0.075 }, "type": "chat" }, { - "id": "openai-gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "nvidia/Nemotron-3-Nano-Omni", + "name": "Nemotron-3-Nano-Omni", + "display_name": "Nemotron-3-Nano-Omni", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 65536, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.06, + "output": 0.24, 
+ "cache_read": 0.006, + "cache_write": 0.075 }, "type": "chat" }, { - "id": "openai-gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", + "name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2026-02-04", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.6, + "output": 1.8, + "cache_read": 0.06, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "anthropic-claude-4.5-sonnet", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron-3-Super-120B-A12B", + "display_name": "Nemotron-3-Super-120B-A12B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -33996,46 +36082,24 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - 
"output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 - } + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "openai-o3", - "name": "o3", - "display_name": "o3", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -34043,30 +36107,42 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2026-01", + "release_date": "2026-03-01", + "last_updated": "2026-03-10", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1, + "output": 3.2, + "cache_read": 0.1, + "cache_write": 1 }, "type": "chat" }, { - "id": "mistral-3-14B", - "name": "Ministral 3 14B Instruct", - "display_name": "Ministral 3 14B Instruct", + "id": "deepseek-ai/DeepSeek-V3.2-fast", + "name": "DeepSeek-V3.2-fast", + "display_name": "DeepSeek-V3.2-fast", "modalities": { "input": [ "text" @@ -34076,55 +36152,32 @@ ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2026-04-30", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": 
"2026-05-07", "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "mistral-7b-instruct-v0.3", - "name": "Mistral 7B Instruct v0.3", - "display_name": "Mistral 7B Instruct v0.3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "input": 0.4, + "output": 2, + "cache_read": 0.04, + "cache_write": 0.5 }, - "attachment": false, - "open_weights": true, - "release_date": "2024-05-22", - "last_updated": "2024-05-22", "type": "chat" }, { - "id": "openai-gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -34134,8 +36187,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -34156,83 +36209,67 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2026-04-16", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.1, - "output": 0.7 + "input": 1.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 163000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": 
"mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-01-20", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 0.45, + "reasoning": 0.45, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "multi-qa-mpnet-base-dot-v1", - "name": "Multi-QA-mpnet-base-dot-v1", - "display_name": "Multi-QA-mpnet-base-dot-v1", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -34242,63 +36279,72 @@ ] }, "limit": { - "context": 512, - "output": 768 + "context": 196608, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0.009, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai-gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o 
mini", + "id": "MiniMaxAI/MiniMax-M2.5-fast", + "name": "MiniMax-M2.5-fast", + "display_name": "MiniMax-M2.5-fast", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2026-05-07", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "llama3-8b-instruct", - "name": "Llama 3.1 Instruct (8B)", - "display_name": "Llama 3.1 Instruct (8B)", + "id": "PrimeIntellect/INTELLECT-3", + "name": "INTELLECT-3", + "display_name": "INTELLECT-3", "modalities": { "input": [ "text" @@ -34308,8 +36354,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -34318,19 +36364,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-10", + "release_date": "2026-01-25", + "last_updated": "2026-02-04", "cost": { - "input": 0.198, - "output": 0.198 + "input": 0.2, + "output": 1.1, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" - }, + } + ] + }, + "auriko": { + "id": "auriko", + "name": "Auriko", + "display_name": "Auriko", + "api": "https://api.auriko.ai/v1", + "doc": "https://docs.auriko.ai", + "models": [ { - "id": "all-mini-lm-l6-v2", - "name": "All-MiniLM-L6-v2", - "display_name": "All-MiniLM-L6-v2", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + 
"display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -34340,126 +36397,128 @@ ] }, "limit": { - "context": 256, - "output": 384 + "context": 1000000, + "output": 384000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2021-08-30", - "last_updated": "2026-04-16", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.009, - "output": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "anthropic-claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "summaries": true, + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2025-02-24", - "last_updated": 
"2025-02-24", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", - "modalities": { - "input": [ - "text" + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", - "cost": { - "input": 0.02, - "output": 0 + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, - "type": "embedding" + "type": "chat" }, { - "id": "nemotron-3-nano-30b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", + "id": "grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -34467,20 +36526,48 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", + "cost": { + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + 
"cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "anthropic-claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -34488,252 +36575,203 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 - } + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai-gpt-5.2-pro", - "name": "GPT-5.2 pro", - "display_name": "GPT-5.2 pro", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 21, - "output": 168 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "openai-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 
1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "anthropic-claude-4.5-haiku", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", - "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 - }, - "type": "chat" - }, - { - "id": "stable-diffusion-3.5-large", - "name": "Stable Diffusion 3.5 Large", - "display_name": "Stable Diffusion 3.5 Large", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 256, - "output": 1 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-04-30", - "cost": { - 
"input": 0.08, - "output": 0 - }, - "type": "chat" - }, - { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.95, - "output": 4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "minimax-m2-7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -34743,7 +36781,7 @@ ] }, "limit": { - "context": 131072, + "context": 204800, "output": 131072 }, "temperature": true, @@ -34754,127 +36792,119 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-08-05", - "last_updated": "2026-04-16", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.05, - "output": 0.45 + "input": 0.6, + "output": 2.4, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "ministral-3-8b-instruct-2512", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-15", - "last_updated": "2025-12-15", - "type": "chat" - }, - { - "id": "openai-gpt-image-1.5", - "name": "GPT Image 1.5", - "display_name": "GPT Image 1.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": 
false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 10, - "cache_read": 1 + "input": 0.3, + "output": 1.2, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "anthropic-claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "qwen-3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.5, + "output": 3, + "cache_read": 0.1, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "openai-gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, @@ -34882,33 +36912,45 @@ "supported": true, "default": true }, - 
"attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.5, + "output": 2.8 }, "type": "chat" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -34918,89 +36960,102 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-30", - "last_updated": "2025-01-30", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.99, - "output": 0.99 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "llama3.3-70b-instruct", - "name": "Llama 3.3 Instruct 70B", - "display_name": "Llama 3.3 Instruct 70B", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, 
+ "output": 65536 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.65, - "output": 0.65 - }, - "type": "chat" - }, - { - "id": "openai-o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 100000 - }, - "temperature": false, - "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -35015,7 +37070,7 @@ "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -35025,33 +37080,35 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": 
"effort", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh", "max" ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { "input": 5, "output": 25, @@ -35061,79 +37118,120 @@ "type": "chat" }, { - "id": "bge-reranker-v2-m3", - "name": "BGE Reranker v2 M3", - "display_name": "BGE Reranker v2 M3", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1 + "context": 1000000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-03-12", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": 
"high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.01, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, - "type": "rerank" - }, + "type": "chat" + } + ] + }, + "stepfun-ai": { + "id": "stepfun-ai", + "name": "StepFun AI", + "display_name": "StepFun AI", + "api": "https://api.stepfun.ai/step_plan/v1", + "doc": "https://platform.stepfun.ai/docs/en/step-plan/integrations/open-code", + "models": [ { - "id": "openai-gpt-5-mini", - "name": "GPT-5 mini", - "display_name": "GPT-5 mini", + "id": "step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "gemma-4-31B-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "step-3.5-flash-2603", + 
"name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -35141,27 +37239,39 @@ }, "limit": { "context": 256000, - "output": 8192 + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-30", + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.18, - "output": 0.5 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" - }, + } + ] + }, + "vivgrid": { + "id": "vivgrid", + "name": "Vivgrid", + "display_name": "Vivgrid", + "api": "https://api.vivgrid.com/v1", + "doc": "https://docs.vivgrid.com/models", + "models": [ { - "id": "qwen-2.5-14b-instruct", - "name": "Qwen 2.5 14B Instruct", - "display_name": "Qwen 2.5 14B Instruct", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -35171,25 +37281,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 + }, "type": "chat" }, { - "id": "openai-gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "gpt-5.4-nano", + 
"name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", @@ -35201,45 +37328,67 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -35249,110 +37398,107 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "max" + "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + 
"high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 0.5, - "cache_write": 6.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 0.5, - "cache_write": 6.25 - } + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": 
"2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.45, - "output": 1.7 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai-o1", - "name": "o1", - "display_name": "o1", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -35360,91 +37506,165 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + 
"none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-11-05", - "last_updated": "2024-11-05", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "e5-large-v2", - "name": "E5 Large v2", - "display_name": "E5 Large v2", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512, - "output": 1024 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-05-19", - "last_updated": "2026-04-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.02, - "output": 0 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "anthropic-claude-4.6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ 
"text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -35452,8 +37672,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -35461,22 +37681,37 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, + "input": 2, + "output": 12, + "cache_read": 0.2, "tiers": [ { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75, + "input": 4, + "output": 18, + "cache_read": 0.4, "tier": { "type": "context", "size": 200000 @@ -35484,18 +37719,17 @@ } ], "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 4, + "output": 18, + "cache_read": 0.4 } }, "type": "chat" }, { - "id": "openai-gpt-5-nano", - "name": "GPT-5 nano", - "display_name": "GPT-5 nano", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -35506,7 +37740,7 @@ ] }, "limit": { - "context": 400000, + "context": 272000, "output": 128000 }, "temperature": false, @@ -35515,22 +37749,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + 
"visibility": "hidden" + } + }, "attachment": true, "open_weights": false, "knowledge": "2024-05-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -35540,26 +37795,133 @@ ] }, "limit": { - "context": 8000, - "output": 1024 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-06-03", - "last_updated": "2026-04-16", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.04, - "output": 0 + "input": 0.28, + "output": 0.42 }, - "type": "embedding" + "type": "chat" }, { - "id": "openai-gpt-5.5", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 + }, + "type": "chat" + }, + { + "id": 
"gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "gpt-5.5", "name": "GPT-5.5", "display_name": "GPT-5.5", "modalities": { @@ -35573,7 +37935,7 @@ ] }, "limit": { - "context": 1000000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -35582,11 +37944,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, "knowledge": "2025-12-01", "release_date": "2026-04-23", - "last_updated": "2026-04-30", + "last_updated": "2026-04-23", "cost": { "input": 5, "output": 30, @@ -35609,11 +37992,19 @@ } }, "type": "chat" - }, + } + ] + }, + "mistral": { + "id": "mistral", + "name": "Mistral", + "display_name": "Mistral", + "doc": "https://docs.mistral.ai/getting-started/models/", + "models": [ { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "codestral-latest", + 
"name": "Codestral (latest)", + "display_name": "Codestral (latest)", "modalities": { "input": [ "text" @@ -35623,39 +38014,62 @@ ] }, "limit": { - "context": 202752, - "output": 128000 + "context": 256000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-04-16", + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", "cost": { - "input": 1, - "output": 3.2 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "open-mistral-7b", + "name": "Mistral 7B", + "display_name": "Mistral 7B", "modalities": { "input": [ "text" @@ -35665,8 +38079,8 @@ ] }, "limit": { - "context": 163840, - "output": 131072 + "context": 8000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -35675,15 +38089,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-03-24", + "knowledge": "2023-12", + "release_date": "2023-09-27", + "last_updated": "2023-09-27", + 
"cost": { + "input": 0.25, + "output": 0.25 + }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ "text" @@ -35693,65 +38111,61 @@ ] }, "limit": { - "context": 256000, + "context": 128000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-16", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.25, - "output": 0.9, - "cache_read": 0.06 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic-claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "ministral-3b-latest", + "name": "Ministral 3B (latest)", + "display_name": "Ministral 3B (latest)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-06-20", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "nemotron-nano-12b-v2-vl", - "name": "Nemotron Nano 12B v2 VL", - "display_name": "Nemotron Nano 12B v2 VL", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ 
"text", @@ -35763,29 +38177,28 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2026-04-30", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gte-large-en-v1.5", - "name": "GTE Large (v1.5)", - "display_name": "GTE Large (v1.5)", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -35795,132 +38208,93 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-03-27", - "last_updated": "2026-04-16", + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.09, - "output": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4.8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "mistral-embed", + "name": "Mistral Embed", + "display_name": "Mistral Embed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8000, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - 
"xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-29", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-04-30", + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.55, - "output": 3.5 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "ministral-8b-latest", + "name": "Ministral 8B (latest)", + "display_name": "Ministral 8B (latest)", 
"modalities": { "input": [ "text" @@ -35930,96 +38304,65 @@ ] }, "limit": { - "context": 204800, + "context": 128000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2026-02-12", - "last_updated": "2026-04-16", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-04", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "anthropic-claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "open-mixtral-8x22b", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 64000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 1, - "cache_write": 1.25 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "deepseek-4-flash", - "name": "Deepseek V4 Flash", - "display_name": "Deepseek V4 Flash", + "id": "mistral-medium-latest", + "name": "Mistral Medium (latest)", + "display_name": "Mistral Medium (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -36027,23 +38370,28 @@ }, "limit": { "context": 262144, - "output": 8192 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-27", - "last_updated": "2026-05-29", + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "cost": { + "input": 0.4, + "output": 2 + }, "type": "chat" }, { - "id": "mistral-nemo-instruct-2407", - "name": "Mistral Nemo Instruct", - "display_name": "Mistral Nemo Instruct", + "id": "devstral-small-2505", + "name": "Devstral Small 2505", + "display_name": "Devstral Small 2505", "modalities": { "input": [ "text" @@ -36054,7 +38402,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -36063,18 +38411,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.3, + "input": 0.1, "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": 
"magistral-small", + "name": "Magistral Small", + "display_name": "Magistral Small", "modalities": { "input": [ "text" @@ -36084,8 +38433,8 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -36093,35 +38442,25 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-17", "cost": { - "input": 1.74, - "output": 3.48 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "mistral-medium-2604", + "name": "Mistral Medium 3.5", + "display_name": "Mistral Medium 3.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -36129,100 +38468,94 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-04-16", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 0.5, - "output": 2.7 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "openai-gpt-image-1", - "name": "GPT Image 1", - "display_name": "GPT Image 1", + "id": "mistral-small-latest", + "name": "Mistral Small (latest)", + 
"display_name": "Mistral Small (latest)", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 5, - "output": 40, - "cache_read": 1.25 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-tts-voicedesign", - "name": "Qwen3 TTS VoiceDesign", - "display_name": "Qwen3 TTS VoiceDesign", + "id": "open-mixtral-8x7b", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 1 + "context": 32000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-30", + "knowledge": "2024-01", + "release_date": "2023-12-11", + "last_updated": "2023-12-11", + "cost": { + "input": 0.7, + "output": 0.7 + }, "type": "chat" }, { - "id": "alibaba-qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "devstral-latest", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -36232,29 +38565,29 @@ ] }, "limit": { - "context": 131000, - "output": 40960 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-30", - 
"last_updated": "2026-04-16", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.25, - "output": 0.55 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai-gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ "text", @@ -36265,242 +38598,225 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "anthropic-claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 
beta header for this model family." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai-gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "fal-ai/fast-sdxl", - "name": "Fast SDXL", - "display_name": "Fast SDXL", + "id": "mistral-medium-2508", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-07-26", - "last_updated": "2026-04-16", + "attachment": true, + "open_weights": 
false, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "cost": { + "input": 0.4, + "output": 2 + }, "type": "chat" }, { - "id": "fal-ai/elevenlabs/tts/multilingual-v2", - "name": "ElevenLabs Multilingual TTS v2", - "display_name": "ElevenLabs Multilingual TTS v2", + "id": "open-mistral-nemo", + "name": "Open Mistral Nemo", + "display_name": "Open Mistral Nemo", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2023-08-22", - "last_updated": "2026-04-16", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", + "cost": { + "input": 0.15, + "output": 0.15 + }, "type": "chat" }, { - "id": "fal-ai/stable-audio-25/text-to-audio", - "name": "Stable Audio 2.5 (Text-to-Audio)", - "display_name": "Stable Audio 2.5 (Text-to-Audio)", + "id": "magistral-medium-latest", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-04-16", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", + "cost": { + "input": 2, + "output": 5 + }, "type": "chat" }, { - "id": "fal-ai/flux/schnell", - "name": "FLUX.1 [schnell]", - "display_name": "FLUX.1 [schnell]", + "id": 
"devstral-medium-latest", + "name": "Devstral 2 (latest)", + "display_name": "Devstral 2 (latest)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-04-16", + "knowledge": "2025-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.4, + "output": 2 + }, "type": "chat" - } - ] - }, - "submodel": { - "id": "submodel", - "name": "submodel", - "display_name": "submodel", - "api": "https://llm.submodel.ai/v1", - "doc": "https://submodel.gitbook.io", - "models": [ + }, { - "id": "zai-org/GLM-4.5-FP8", - "name": "GLM 4.5 FP8", - "display_name": "GLM 4.5 FP8", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -36510,40 +38826,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "labs-devstral-small-2512", + "name": "Devstral Small 2", + "display_name": "Devstral Small 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, 
@@ -36552,198 +38869,85 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "pixtral-12b", + "name": "Pixtral 12B", + "display_name": "Pixtral 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "attachment": true, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 75000, - "output": 163840 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", - "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 
75000, - "output": 163840 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { "input": 0.5, - "output": 2.15 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", - "cost": { - "input": 0.2, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", - "cost": { - "input": 0.2, - "output": 0.3 + "output": 1.5 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "devstral-medium-2507", + "name": "Devstral Medium", + "display_name": "Devstral Medium", "modalities": { "input": [ "text" @@ -36753,8 +38957,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -36762,49 +38966,13 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", - "cost": { - "input": 0.2, - "output": 0.8 - }, - "type": "chat" - }, - { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, "open_weights": true, - "release_date": "2025-08-23", - "last_updated": "2025-08-23", + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.1, - "output": 0.5 + "input": 0.4, + "output": 2 }, "type": "chat" } @@ -36889,28 +39057,29 @@ } ] }, - "kimi-for-coding": { - "id": "kimi-for-coding", - "name": "Kimi For Coding", - "display_name": "Kimi For Coding", - "api": "https://api.kimi.com/coding/v1", - "doc": "https://www.kimi.com/code/docs/en/third-party-tools/other-coding-agents.html", + "firepass": { + "id": "firepass", + "name": "Fireworks (Firepass)", + "display_name": "Fireworks (Firepass)", + "api": "https://api.fireworks.ai/inference/v1/", + "doc": "https://docs.fireworks.ai/firepass", "models": [ { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": 
"accounts/fireworks/routers/kimi-k2p6-turbo", + "name": "Kimi K2.6 Turbo", + "display_name": "Kimi K2.6 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -36931,34 +39100,41 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11", - "last_updated": "2025-12", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { "input": 0, "output": 0, - "cache_read": 0, - "cache_write": 0 + "cache_read": 0 }, "type": "chat" - }, + } + ] + }, + "anyapi": { + "id": "anyapi", + "name": "AnyAPI", + "display_name": "AnyAPI", + "api": "https://api.anyapi.ai/v1", + "doc": "https://docs.anyapi.ai", + "models": [ { - "id": "k2p5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "xai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -36966,36 +39142,36 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "type": "chat" }, { - "id": "k2p6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - 
"output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37003,43 +39179,51 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04", - "last_updated": "2026-04", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "type": "chat" - } - ] - }, - "dinference": { - "id": "dinference", - "name": "DInference", - "display_name": "DInference", - "api": "https://api.dinference.com/v1", - "doc": "https://dinference.com", - "models": [ + }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37050,76 +39234,101 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 
0.45, - "output": 1.65 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08", - "last_updated": "2025-08", - "cost": { - "input": 0.0675, - "output": 0.27 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37130,39 +39339,46 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], 
"summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 0.75, - "output": 2.4 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -37172,26 +39388,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", - "cost": { - "input": 0.22, - "output": 0.88 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -37199,9 +39428,9 @@ }, "limit": { "context": 200000, - "output": 128000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -37210,100 +39439,123 @@ 
"extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 1.25, - "output": 3.89 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "type": "chat" - } - ] - }, - "novita-ai": { - "id": "novita-ai", - "name": "NovitaAI", - "display_name": "NovitaAI", - "api": "https://api.novita.ai/openai", - "doc": "https://novita.ai/docs/guides/introduction", - "models": [ + }, { - "id": "kwaipilot/kat-coder-pro", - "name": "Kat Coder Pro", - "display_name": "Kat Coder Pro", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-05", - "last_updated": "2026-01-05", - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "type": "chat" }, { - "id": 
"nousresearch/hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", - "cost": { - "input": 0.14, - "output": 0.14 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -37313,250 +39565,307 @@ ] }, "limit": { - "context": 60288, - "output": 16000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-30", - "last_updated": "2024-07-30", - "cost": { - "input": 0.04, - "output": 0.17 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": false, + "open_weights": false, 
+ "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 0.7, - "output": 2.5, - "cache_read": 0.35 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - 
"release_date": "2025-03-25", - "last_updated": "2025-03-25", - "cost": { - "input": 0.27, - "output": 1.12, - "cache_read": 0.135 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "Deepseek V3.2", - "display_name": "Deepseek V3.2", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.269, - "output": 0.4, - "cache_read": 0.1345 + "supported": false }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "deepseek/deepseek-r1-turbo", - "name": "DeepSeek R1 (Turbo)\t", - "display_name": "DeepSeek R1 (Turbo)\t", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 400000, + "output": 128000 }, 
- "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", - "cost": { - "input": 0.7, - "output": 2.5 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "type": "chat" }, { - "id": "deepseek/deepseek-prover-v2-671b", - "name": "Deepseek Prover V2 671B", - "display_name": "Deepseek Prover V2 671B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-30", - "last_updated": "2025-04-30", - "cost": { - "input": 0.7, - "output": 2.5 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill LLama 70B", - "display_name": "DeepSeek R1 Distill LLama 70B", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - 
"tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 0.8, - "output": 0.8 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "Deepseek V3.1 Terminus", - "display_name": "Deepseek V3.1 Terminus", + "id": "mistralai/devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -37566,373 +39875,420 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", - "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 - }, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528-qwen3-8b", - "name": "DeepSeek R1 0528 Qwen3 8B", - "display_name": "DeepSeek R1 0528 Qwen3 8B", + "id": "mistralai/mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": 
true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-05-29", - "last_updated": "2025-05-29", - "cost": { - "input": 0.06, - "output": 0.09 - }, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "type": "chat" }, { - "id": "deepseek/deepseek-v3-turbo", - "name": "DeepSeek V3 (Turbo)\t", - "display_name": "DeepSeek V3 (Turbo)\t", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-05", - "last_updated": "2025-03-05", - "cost": { - "input": 0.4, - "output": 1.3 + "supported": true, + "default": false }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-ocr", - "name": "DeepSeek-OCR", - "display_name": "DeepSeek-OCR", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-24", - "last_updated": "2025-10-24", - "cost": { - "input": 0.03, - "output": 0.03 - }, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-14b", - "name": "DeepSeek R1 Distill Qwen 14B", - "display_name": "DeepSeek R1 Distill Qwen 14B", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.15, - "output": 0.15 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "Deepseek V3.2 Exp", - "display_name": "Deepseek V3.2 Exp", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 0.27, - "output": 0.41 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 1.69, - "output": 3.38, - "cache_read": 0.13 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": "deepseek/deepseek-ocr-2", - "name": "deepseek/deepseek-ocr-2", - "display_name": "deepseek/deepseek-ocr-2", + "id": "cohere/command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", - "cost": { - "input": 0.03, - "output": 0.03 - }, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "perplexity/sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "type": "chat" 
}, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek R1 Distill Qwen 32B", - "display_name": "DeepSeek R1 Distill Qwen 32B", + "id": "perplexity/sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 32000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.3, - "output": 0.3 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "type": "chat" }, { - "id": "xiaomimimo/mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -37942,8 +40298,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -37963,71 +40319,16 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-05-27", - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } - }, - "type": "chat" - }, - { - "id": "xiaomimimo/mimo-v2-flash", - "name": "XiaomiMiMo/MiMo-V2-Flash", - "display_name": "XiaomiMiMo/MiMo-V2-Flash", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": 
true, - "default": true - }, - "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-19", - "last_updated": "2025-12-19", - "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.3 - }, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "xiaomimimo/mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -38037,8 +40338,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -38059,36 +40360,15 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-05-27", - "cost": { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } - }, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -38098,8 +40378,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -38118,21 +40398,17 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.55, - "output": 2.2, - "cache_read": 0.11 - }, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", 
"type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -38142,54 +40418,48 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 - }, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "type": "chat" - }, + } + ] + }, + "google": { + "id": "google", + "name": "google", + "display_name": "google", + "doc": "https://ai.google.dev/gemini-api/docs/models", + "models": [ { - "id": "zai-org/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", + "image", "video", - "image" + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -38197,152 +40467,219 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.6, - "output": 
1.8, - "cache_read": 0.11 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "zai-org/glm-4.6v", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "gemini-2.5-flash-preview-tts", + "name": "Gemini 2.5 Flash Preview TTS", + "display_name": "Gemini 2.5 Flash Preview TTS", "modalities": { "input": [ - "text", - "video", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.055 + "input": 0.5, + "output": 10 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 128, + "max": 32768 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": 
"2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-12", + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - 
"name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -38353,29 +40690,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" }, { - "id": "zai-org/autoglm-phone-9b-multilingual", - "name": "AutoGLM-Phone-9B-Multilingual", - "display_name": "AutoGLM-Phone-9B-Multilingual", + "id": "gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -38386,61 +40733,64 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2025-12-10", - "last_updated": "2025-12-10", - "cost": { - "input": 0.035, - "output": 0.138 - }, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "type": "chat" }, { - "id": "zai-org/glm-4.5-air", - "name": "GLM 4.5 Air", - 
"display_name": "GLM 4.5 Air", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-10-13", - "last_updated": "2025-10-13", + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.13, - "output": 0.85 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "zai-org/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -38450,53 +40800,43 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 2048, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.15, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5-122B-A10B", - 
"display_name": "Qwen3.5-122B-A10B", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -38508,414 +40848,617 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.4, - "output": 3.2 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "attachment": true, + 
"open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen2.5 VL 72B Instruct", - "display_name": "Qwen2.5 VL 72B Instruct", + "id": "gemini-3-pro-image-preview", + "name": "Nano Banana Pro", + "display_name": "Nano Banana Pro", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 32768, + "context": 131072, "output": 32768 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 0.8, - "output": 0.8 + "input": 2, + "output": 120 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "qwen/qwen3-vl-30b-a3b-instruct", - "display_name": "qwen/qwen3-vl-30b-a3b-instruct", + "id": "gemini-2.5-flash-image", + "name": "Gemini 2.5 Flash Image", + "display_name": "Gemini 2.5 Flash Image", "modalities": { "input": [ "text", - "video", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - 
"last_updated": "2025-10-11", + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", "cost": { - "input": 0.2, - "output": 0.7 + "input": 0.3, + "output": 30, + "cache_read": 0.075 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-8b-fp8", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.035, - "output": 0.138 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30b A3B Instruct", - "display_name": "Qwen3 Coder 30b A3B Instruct", + "id": "gemini-3.1-flash-image-preview", + "name": "Nano Banana 2", + "display_name": "Nano Banana 2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + 
"image" ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.5, + "output": 60 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "qwen/qwen3-vl-30b-a3b-thinking", - "display_name": "qwen/qwen3-vl-30b-a3b-thinking", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.2, - "output": 1 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 
200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", - "cost": { - "input": 0.2, - "output": 0.8 - }, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.3, - "output": 1.5 + "input": 
2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen/qwen3-32b-fp8", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.1, - "output": 0.45 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "gemini-2.5-pro-preview-tts", + "name": "Gemini 2.5 Pro Preview TTS", + "display_name": "Gemini 2.5 Pro Preview TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "knowledge": "2025-01", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 2.11, - "output": 8.45 + "input": 1, + "output": 20 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22b Thinking 2507", - "display_name": "Qwen3 235B A22b Thinking 2507", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + 
"context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -38925,214 +41468,235 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.3, - "output": 3 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen3-4b-fp8", - "name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash Lite", + "display_name": "Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 20000 + "context": 1048576, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "search": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen3.7-max", - "name": "Qwen3.7-Max", - "display_name": "Qwen3.7-Max", + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview 09 2025", + "display_name": "Gemini 2.5 Flash Preview 09 2025", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, 
"output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": -1, + "min": 0, + "max": 24576 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-27", - "cost": { - "input": 1.25, - "output": 3.75, - "cache_read": 0.125, - "cache_write": 1.5625 + "search": { + "supported": true, + "default": false }, + "attachment": true, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-thinking", - "name": "Qwen3 Omni 30B A3B Thinking", - "display_name": "Qwen3 Omni 30B A3B Thinking", + "id": "gemini-2.5-flash-image-preview", + "name": "Gemini 2.5 Flash Image Preview", + "display_name": "Gemini 2.5 Flash Image Preview", "modalities": { "input": [ "text", - "audio", - "video", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", - "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "supported": false }, - "type": "chat" + "attachment": false, + "type": "imageGeneration" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "qwen/qwen3-vl-8b-instruct", 
- "display_name": "qwen/qwen3-vl-8b-instruct", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview 09 2025", + "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": -1, + "min": 512, + "max": 24576 + } }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2025-10-17", - "cost": { - "input": 0.08, - "output": 0.5 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "search": { + "supported": true, + "default": false }, + "attachment": true, "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gemini-2.0-flash-preview-image-generation", + "name": "Gemini 2.0 Flash Preview Image Generation", + "display_name": "Gemini 2.0 Flash Preview Image Generation", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 0.3, - "output": 1.3 + "search": { + "supported": false }, + "attachment": true, 
"type": "chat" - }, + } + ] + }, + "opencode-go": { + "id": "opencode-go", + "name": "OpenCode Go", + "display_name": "OpenCode Go", + "api": "https://opencode.ai/zen/go/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -39142,8 +41706,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -39164,30 +41728,30 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.15, - "output": 1.5 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5-35B-A3B", - "display_name": "Qwen3.5-35B-A3B", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 204800, "output": 65536 }, "temperature": true, @@ -39198,98 +41762,123 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.25, - "output": 2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "qwen/qwen2.5-7b-instruct", - "name": 
"Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.07, - "output": 0.07 + "input": 0.4, + "output": 1.6, + "cache_read": 0.04, + "cache_write": 0.5, + "tiers": [ + { + "input": 1.2, + "output": 4.8, + "cache_read": 0.12, + "cache_write": 1.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 1.2, + "output": 4.8, + "cache_read": 0.12, + "cache_write": 1.5 + } }, "type": "chat" }, { - "id": "qwen/qwen3-omni-30b-a3b-instruct", - "name": "Qwen3 Omni 30B A3B Instruct", - "display_name": "Qwen3 Omni 30B A3B Instruct", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ - "text", - "video", - "audio", - "image" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-05-21", + 
"last_updated": "2026-05-21", "cost": { - "input": 0.25, - "output": 0.97, - "input_audio": 2.2, - "output_audio": 1.788 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -39299,42 +41888,53 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, "knowledge": "2025-04", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.09, - "output": 0.58 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -39353,52 +41953,63 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.74, + "output": 3.48, + "cache_read": 0.0145 }, "type": 
"chat" }, { - "id": "qwen/qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "minimax-m3", + "name": "MiniMax M3", + "display_name": "MiniMax M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 20000 + "context": 512000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "knowledge": "2025-01", + "release_date": "2026-05-31", + "last_updated": "2026-05-31", "cost": { - "input": 0.09, - "output": 0.45 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5-27B", - "display_name": "Qwen3.5-27B", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", @@ -39431,19 +42042,22 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.3, - "output": 2.4 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "qwen/qwen-mt-plus", - "name": "Qwen MT Plus", - "display_name": "Qwen MT Plus", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -39453,28 +42067,42 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-09-03", - "last_updated": "2025-09-03", + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.25, - "output": 0.75 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -39486,11 +42114,11 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -39508,53 +42136,74 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.98, - "output": 3.95 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, 
+ "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-10-15", - "last_updated": "2024-10-15", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.38, - "output": 0.4 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "mimo-v2-omni", + "name": "MiMo V2 Omni", + "display_name": "MiMo V2 Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "pdf" ], "output": [ "text" @@ -39562,7 +42211,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -39581,64 +42230,80 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "knowledge": "2024-10", + "release_date": 
"2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.57, - "output": 2.3 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -39659,20 +42324,36 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text" @@ -39682,42 +42363,53 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-12", + 
"release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - "output": 2.5 + "input": 1.74, + "output": 3.48, + "cache_read": 0.0145 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -39736,117 +42428,188 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout Instruct", - "display_name": "Llama 4 Scout Instruct", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.18, - "output": 0.59 + "input": 0.5, + 
"output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" - }, + } + ] + }, + "digitalocean": { + "id": "digitalocean", + "name": "DigitalOcean", + "display_name": "DigitalOcean", + "api": "https://inference.do-ai.run/v1", + "doc": "https://docs.digitalocean.com/products/gradient-ai-platform/details/models/", + "models": [ { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "anthropic-claude-haiku-4.5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.03, - "output": 0.05 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick Instruct", - "display_name": "Llama 4 Maverick Instruct", + "id": "openai-gpt-image-1", + "name": "GPT Image 1", + "display_name": "GPT Image 1", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-06", - "last_updated": "2025-04-06", + "open_weights": false, + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "cost": { - "input": 0.27, - "output": 0.85 + "input": 5, + "output": 40, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Llama3 70B Instruct", - "display_name": "Llama3 70B Instruct", + "id": "e5-large-v2", + "name": "E5 Large v2", + "display_name": "E5 Large v2", "modalities": { "input": [ "text" @@ -39856,28 +42619,28 @@ ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 512, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "release_date": "2023-05-19", + "last_updated": "2026-04-30", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0.02, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "bge-m3", + "name": "BGE M3", + "display_name": "BGE M3", 
"modalities": { "input": [ "text" @@ -39888,58 +42651,27 @@ }, "limit": { "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", - "cost": { - "input": 0.04, - "output": 0.04 - }, - "type": "chat" - }, - { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 16384 + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "release_date": "2024-01-30", + "last_updated": "2026-04-30", "cost": { "input": 0.02, - "output": 0.05 + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "mistral-3-14B", + "name": "Ministral 3 14B Instruct", + "display_name": "Ministral 3 14B Instruct", "modalities": { "input": [ "text" @@ -39949,8 +42681,8 @@ ] }, "limit": { - "context": 131072, - "output": 120000 + "context": 262144, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -39959,52 +42691,56 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-07", - "last_updated": "2024-12-07", + "release_date": "2025-12-15", + "last_updated": "2026-04-30", "cost": { - "input": 0.135, - "output": 0.4 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "ERNIE 4.5 VL 424B A47B", - "display_name": "ERNIE 4.5 VL 424B A47B", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 204800, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "knowledge": "2025-08", + "release_date": "2026-02-12", + "last_updated": "2026-04-16", "cost": { - "input": 0.42, - "output": 1.25 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "ERNIE 4.5 VL 28B A3B", - "display_name": "ERNIE 4.5 VL 28B A3B", + "id": "openai-gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -40015,60 +42751,31 @@ ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", - "cost": { - "input": 1.4, - "output": 5.6 - }, - "type": "chat" - }, - { - "id": "baidu/ernie-4.5-300b-a47b-paddle", - "name": "ERNIE 4.5 300B A47B", - "display_name": "ERNIE 4.5 300B A47B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 123000, - "output": 12000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.2, + "output": 1.25, + 
"cache_read": 0.02 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b", - "name": "ERNIE 4.5 21B A3B", - "display_name": "ERNIE 4.5 21B A3B", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -40078,8 +42785,8 @@ ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 163840, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -40088,86 +42795,78 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-30", - "last_updated": "2025-06-30", - "cost": { - "input": 0.07, - "output": 0.28 - }, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-03-24", "type": "chat" }, { - "id": "baidu/ernie-4.5-21B-a3b-thinking", - "name": "ERNIE-4.5-21B-A3B-Thinking", - "display_name": "ERNIE-4.5-21B-A3B-Thinking", + "id": "openai-gpt-image-2", + "name": "GPT Image 2", + "display_name": "GPT Image 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.07, - "output": 0.28 + "supported": false }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-24", + "last_updated": "2025-04-24", "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b-thinking", - "name": "ERNIE-4.5-VL-28B-A3B-Thinking", - "display_name": "ERNIE-4.5-VL-28B-A3B-Thinking", + "id": "openai-gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + 
"output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.39, - "output": 0.39 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimaxai/minimax-m1-80k", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ "text" @@ -40177,8 +42876,8 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -40186,51 +42885,25 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", - "cost": { - "input": 0.55, - "output": 2.2 - }, - "type": "chat" - }, - { - "id": "gryphe/mythomax-l2-13b", - "name": "Mythomax L2 13B", - "display_name": "Mythomax L2 13B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4096, - "output": 3200 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", + "release_date": "2025-01-30", + "last_updated": "2025-01-30", "cost": { - "input": 0.09, - "output": 0.09 + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "Wizardlm 2 8x22B", - "display_name": "Wizardlm 2 8x22B", + "id": "qwen3-embedding-0.6b", + "name": "Qwen3 Embedding 0.6B", + 
"display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -40240,187 +42913,247 @@ ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 8000, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", + "release_date": "2025-06-03", + "last_updated": "2026-04-16", "cost": { - "input": 0.62, - "output": 0.62 + "input": 0.04, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "inclusionai/ling-2.6-flash", - "name": "Ling-2.6-flash", - "display_name": "Ling-2.6-flash", + "id": "gemma-4-31B-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-22", + "last_updated": "2026-04-30", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.18, + "output": 0.5 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-1t", - "name": "Ling-2.6-1T", - "display_name": "Ling-2.6-1T", + "id": "llama-4-maverick", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2024-08", + "release_date": 
"2025-04-05", + "last_updated": "2026-04-30", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 0.87 }, "type": "chat" }, { - "id": "inclusionai/ring-2.6-1t", - "name": "Ring-2.6-1T", - "display_name": "Ring-2.6-1T", + "id": "anthropic-claude-3.7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-05-08", - "last_updated": "2026-05-27", + "knowledge": "2024-11", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.06 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "paddlepaddle/paddleocr-vl", - "name": "PaddleOCR-VL", - "display_name": "PaddleOCR-VL", + "id": "openai-gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "open_weights": false, + "knowledge": "2023-09", + "release_date": 
"2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "sao10K/l3-8b-lunaris", - "name": "Sao10k L3 8B Lunaris\t", - "display_name": "Sao10k L3 8B Lunaris\t", + "id": "anthropic-claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.05, - "output": 0.05 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "sao10K/L3-8B-stheno-v3.2", - "name": "L3 8B Stheno V3.2", - "display_name": "L3 8B Stheno V3.2", + "id": "deepseek-4-flash", + "name": "Deepseek V4 Flash", + "display_name": "Deepseek V4 Flash", "modalities": { "input": [ "text" @@ -40430,8 +43163,8 @@ ] }, "limit": { - "context": 8192, - "output": 32000 + "context": 262144, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -40439,114 +43172,182 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-29", - "last_updated": "2024-11-29", - "cost": { - "input": 0.05, - "output": 0.05 - }, + "open_weights": false, + "release_date": "2026-05-27", + "last_updated": "2026-05-29", "type": "chat" }, { - "id": "sao10K/l3-70b-euryale-v2.1", - "name": "L3 70B Euryale V2.1\t", - "display_name": "L3 70B Euryale V2.1\t", + "id": "anthropic-claude-4.5-haiku", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-18", - "last_updated": "2024-06-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.48, - "output": 1.48 + "input": 1, + "output": 5, + "cache_read": 1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "sao10K/l31-70b-euryale-v2.2", - "name": "L31 70B Euryale V2.2", - "display_name": 
"L31 70B Euryale V2.2", + "id": "anthropic-claude-4.6-sonnet", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.48, - "output": 1.48 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B", - "display_name": "Gemma 4 31B", + "id": "anthropic-claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.14, - "output": 0.4 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "ministral-3-8b-instruct-2512", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ "text", @@ -40557,105 +43358,173 @@ ] }, "limit": { - "context": 98304, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", - "cost": { - "input": 0.119, - "output": 0.2 - }, + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Gemma 3 12B", - "display_name": "Gemma 3 12B", + "id": "anthropic-claude-4.5-sonnet", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": 
"2025-03-13", - "last_updated": "2025-03-13", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.05, - "output": 0.1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.3, + "cache_write": 3.75 + } }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B", - "display_name": "Gemma 4 26B A4B", + "id": "anthropic-claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.13, - "output": 0.4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 0.5, + "cache_write": 6.25 + } }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -40665,27 +43534,33 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.05, - "output": 0.25 + "input": 1.74, + "output": 3.48 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: GPT OSS 20B", - "display_name": "OpenAI: GPT OSS 20B", + "id": "openai-gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -40693,33 +43568,29 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", "cost": { - "input": 0.04, - "output": 0.15 + "input": 0.05, + "output": 0.45 }, "type": "chat" }, { - "id": "baichuan/baichuan-m2-32b", - "name": "baichuan-m2-32b", - "display_name": "baichuan-m2-32b", + "id": "qwen-2.5-14b-instruct", + "name": "Qwen 2.5 14B Instruct", + "display_name": "Qwen 2.5 14B Instruct", "modalities": { "input": [ "text" @@ -40733,124 +43604,159 @@ "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-08-13", - "last_updated": "2025-08-13", - "cost": { - "input": 0.07, - "output": 0.07 - }, + "knowledge": "2024-09", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "type": "chat" }, { - "id": "minimax/minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "anthropic-claude-opus-4.8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", 
"continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-05-27", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-29", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "Minimax M2.1", - "display_name": "Minimax M2.1", + "id": "anthropic-claude-opus-4.5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "anthropic-claude-4.1-opus", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -40858,32 +43764,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "llama3-8b-instruct", + "name": "Llama 3.1 Instruct (8B)", + "display_name": "Llama 3.1 Instruct (8B)", "modalities": { "input": [ "text" @@ -40893,138 +43790,94 @@ ] }, "limit": { - "context": 204800, + "context": 131072, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": 
true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.198, + "output": 0.198 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "stable-diffusion-3.5-large", + "name": "Stable Diffusion 3.5 Large", + "display_name": "Stable Diffusion 3.5 Large", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 256, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "release_date": "2024-10-22", + "last_updated": "2026-04-30", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0.08, + "output": 0 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax M2.5 Highspeed", - "display_name": "MiniMax M2.5 Highspeed", + "id": "openai-gpt-5.4-pro", + "name": "GPT-5.4 pro", + "display_name": "GPT-5.4 pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": 
true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.03 + "input": 30, + "output": 180 }, "type": "chat" - } - ] - }, - "kilo": { - "id": "kilo", - "name": "Kilo Gateway", - "display_name": "Kilo Gateway", - "api": "https://api.kilo.ai/api/gateway", - "doc": "https://kilo.ai", - "models": [ + }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kwaipilot: KAT-Coder-Pro V2", - "display_name": "Kwaipilot: KAT-Coder-Pro V2", + "id": "all-mini-lm-l6-v2", + "name": "All-MiniLM-L6-v2", + "display_name": "All-MiniLM-L6-v2", "modalities": { "input": [ "text" @@ -41034,111 +43887,154 @@ ] }, "limit": { - "context": 256000, - "output": 80000 + "context": 256, + "output": 384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-11", + "release_date": "2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z.ai: GLM 4.6", - "display_name": "Z.ai: GLM 4.6", + "id": "openai-gpt-image-1.5", + "name": "GPT Image 1.5", + "display_name": "GPT Image 1.5", "modalities": { "input": [ - "text" + "text", + "image" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": 
false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "cost": { + "input": 5, + "output": 10, + "cache_read": 1 + }, + "type": "chat" + }, + { + "id": "openai-gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.175 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z.ai: GLM 4.7", - "display_name": "Z.ai: GLM 4.7", + "id": "anthropic-claude-opus-4", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.38, - "output": 1.98, - "cache_read": 0.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "z-ai/glm-4-32b", - "name": "Z.ai: GLM 4 32B ", - "display_name": "Z.ai: GLM 4 32B ", + "id": "bge-reranker-v2-m3", + "name": "BGE Reranker v2 M3", + "display_name": "BGE Reranker v2 M3", "modalities": { "input": [ "text" @@ -41148,28 +44044,28 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2026-03-15", + "release_date": "2024-03-12", + "last_updated": "2026-04-30", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "rerank" }, { - "id": "z-ai/glm-4.5v", - "name": "Z.ai: GLM 4.5V", - "display_name": "Z.ai: GLM 4.5V", + "id": "openai-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -41180,64 +44076,31 @@ ] }, "limit": { - "context": 65536, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-11", - "last_updated": "2025-08-11", - "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 - }, - "type": "chat" - }, - { - "id": "z-ai/glm-4.6v", - "name": "Z.ai: GLM 4.6V", - "display_name": "Z.ai: GLM 4.6V", - "modalities": { - "input": [ - "image", - "text", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - 
"output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-01-10", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "z-ai/glm-4.7-flash", - "name": "Z.ai: GLM 4.7 Flash", - "display_name": "Z.ai: GLM 4.7 Flash", + "id": "openai-o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -41247,70 +44110,62 @@ ] }, "limit": { - "context": 202752, - "output": 40551 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.01 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "z-ai/glm-5v-turbo", - "name": "Z.ai: GLM 5V Turbo", - "display_name": "Z.ai: GLM 5V Turbo", + "id": "multi-qa-mpnet-base-dot-v1", + "name": "Multi-QA-mpnet-base-dot-v1", + "display_name": "Multi-QA-mpnet-base-dot-v1", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 512, + "output": 768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - 
"attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-11", + "release_date": "2021-08-30", + "last_updated": "2026-04-16", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.009, + "output": 0 }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z.ai: GLM 5", - "display_name": "Z.ai: GLM 5", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text" @@ -41320,10 +44175,10 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 262144, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -41342,18 +44197,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-04-16", "cost": { - "input": 0.72, - "output": 2.3 + "input": 0.5, + "output": 2.7 }, "type": "chat" }, { - "id": "z-ai/glm-5-turbo", - "name": "Z.ai: GLM 5 Turbo", - "display_name": "Z.ai: GLM 5 Turbo", + "id": "llama3.3-70b-instruct", + "name": "Llama 3.3 Instruct 70B", + "display_name": "Llama 3.3 Instruct 70B", "modalities": { "input": [ "text" @@ -41363,35 +44219,29 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-11", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.65, + "output": 0.65 }, "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "Z.ai: GLM 4.5", - "display_name": "Z.ai: GLM 
4.5", + "id": "gte-large-en-v1.5", + "name": "GTE Large (v1.5)", + "display_name": "GTE Large (v1.5)", "modalities": { "input": [ "text" @@ -41401,100 +44251,115 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 8192, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2026-03-15", + "release_date": "2024-03-27", + "last_updated": "2026-04-16", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.175 + "input": 0.09, + "output": 0 }, "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "Z.ai: GLM 4.5 Air", - "display_name": "Z.ai: GLM 4.5 Air", + "id": "openai-gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.13, - "output": 0.85, - "cache_read": 0.025 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "Z.ai: GLM 5.1", - "display_name": "Z.ai: GLM 5.1", + "id": "openai-gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, 
"tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-30", "cost": { - "input": 1.26, - "output": 3.96 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "upstage/solar-pro-3", - "name": "Upstage: Solar Pro 3", - "display_name": "Upstage: Solar Pro 3", + "id": "nemotron-3-nano-30b", + "name": "Nemotron 3 Nano 30B A3B", + "display_name": "Nemotron 3 Nano 30B A3B", "modalities": { "input": [ "text" @@ -41504,8 +44369,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -41514,19 +44379,15 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-03-15", - "cost": { - "input": 0.15, - "output": 0.6 - }, + "open_weights": true, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "prime-intellect/intellect-3", - "name": "Prime Intellect: INTELLECT-3", - "display_name": "Prime Intellect: INTELLECT-3", + "id": "openai-gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -41545,84 +44406,98 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": 
true, - "release_date": "2025-11-26", - "last_updated": "2026-02-04", + "knowledge": "2024-06", + "release_date": "2025-08-05", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.1, + "output": 0.7 }, "type": "chat" }, { - "id": "alfredpros/codellama-7b-instruct-solidity", - "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", - "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "id": "openai-gpt-5-nano", + "name": "GPT-5 nano", + "display_name": "GPT-5 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "rekaai/reka-edge", - "name": "Reka Edge", - "display_name": "Reka Edge", + "id": "wan2-2-t2v-a14b", + "name": "Wan2.2-T2V-A14B", + "display_name": "Wan2.2-T2V-A14B", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 100, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-03-20", - "last_updated": "2026-04-11", + "release_date": "2025-07-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.6, + "output": 0 }, "type": 
"chat" }, { - "id": "rekaai/reka-flash-3", - "name": "Reka Flash 3", - "display_name": "Reka Flash 3", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral 7B Instruct v0.3", + "display_name": "Mistral 7B Instruct v0.3", "modalities": { "input": [ "text" @@ -41632,62 +44507,51 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-04-11", - "cost": { - "input": 0.1, - "output": 0.2 - }, + "release_date": "2024-05-22", + "last_updated": "2024-05-22", "type": "chat" }, { - "id": "nousresearch/hermes-4-70b", - "name": "Nous: Hermes 4 70B", - "display_name": "Nous: Hermes 4 70B", + "id": "qwen3-tts-voicedesign", + "name": "Qwen3 TTS VoiceDesign", + "display_name": "Qwen3 TTS VoiceDesign", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 32768, + "output": 1 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2026-03-15", - "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.055 - }, + "release_date": "2026-04-21", + "last_updated": "2026-04-30", "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-405b", - "name": "Nous: Hermes 3 405B Instruct", - "display_name": "Nous: Hermes 3 405B Instruct", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral Nemo Instruct", + "display_name": "Mistral Nemo Instruct", "modalities": { "input": [ "text" @@ -41697,90 +44561,73 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 16384 }, "temperature": true, - "tool_call": false, + 
"tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-16", - "last_updated": "2024-08-16", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1, - "output": 1 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "nousresearch/hermes-3-llama-3.1-70b", - "name": "Nous: Hermes 3 70B Instruct", - "display_name": "Nous: Hermes 3 70B Instruct", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-18", - "last_updated": "2026-03-15", - "cost": { - "input": 0.3, - "output": 0.3 - }, - "type": "chat" - }, - { - "id": "nousresearch/hermes-2-pro-llama-3-8b", - "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-06-27", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "nousresearch/hermes-4-405b", - "name": "Nous: 
Hermes 4 405B", - "display_name": "Nous: Hermes 4 405B", + "id": "deepseek-3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -41790,60 +44637,77 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2026-04-30", "cost": { - "input": 1, - "output": 3 + "input": 0.5, + "output": 1.6 }, "type": "chat" }, { - "id": "mistralai/devstral-medium", - "name": "Mistral: Devstral Medium", - "display_name": "Mistral: Devstral Medium", + "id": "openai-o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.4, - "output": 2 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "mistralai/mistral-small-24b-instruct-2501", - "name": "Mistral: Mistral Small 3", - "display_name": "Mistral: Mistral Small 3", + "id": "qwen3.5-397b-a17b", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B 
A17B", "modalities": { "input": [ "text" @@ -41853,28 +44717,40 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-01-10", + "release_date": "2026-02-15", + "last_updated": "2026-04-30", "cost": { - "input": 0.05, - "output": 0.08 + "input": 0.55, + "output": 3.5 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2411", - "name": "Mistral Large 2411", - "display_name": "Mistral Large 2411", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -41884,8 +44760,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -41894,93 +44770,68 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2024-11-04", - "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" - }, - { - "id": "mistralai/mistral-7b-instruct-v0.1", - "name": "Mistral: Mistral 7B Instruct v0.1", - "display_name": "Mistral: Mistral 7B Instruct v0.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 2824, - "output": 565 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2026-04-30", "cost": { - "input": 0.11, - "output": 0.19 + "input": 0.45, + "output": 1.7 
}, "type": "chat" }, { - "id": "mistralai/mistral-medium-3.1", - "name": "Mistral: Mistral Medium 3.1", - "display_name": "Mistral: Mistral Medium 3.1", + "id": "openai-gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.4, - "output": 2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "mistralai/ministral-14b-2512", - "name": "Mistral: Ministral 3 14B 2512", - "display_name": "Mistral: Ministral 3 14B 2512", + "id": "openai-gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -41989,18 +44840,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2407", - "name": "Mistral Large 2407", - "display_name": "Mistral Large 2407", + "id": "anthropic-claude-3.5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text" @@ -42010,8 +44863,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + 
"context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -42019,85 +44872,58 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-11-05", + "last_updated": "2024-11-05", "cost": { - "input": 2, - "output": 6 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "mistralai/mistral-small-2603", - "name": "Mistral: Mistral Small 4", - "display_name": "Mistral: Mistral Small 4", + "id": "openai-gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-11", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 - }, - "type": "chat" - }, - { - "id": "mistralai/ministral-8b-2512", - "name": "Mistral: Ministral 3 8B 2512", - "display_name": "Mistral: Ministral 3 8B 2512", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.15, - "output": 0.15 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "mistralai/mistral-large", - "name": "Mistral Large", - "display_name": "Mistral 
Large", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -42107,92 +44933,101 @@ ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-12-02", + "release_date": "2026-04-02", + "last_updated": "2026-04-16", "cost": { - "input": 2, - "output": 6 + "input": 0.25, + "output": 0.9, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.1-24b-instruct", - "name": "Mistral: Mistral Small 3.1 24B", - "display_name": "Mistral: Mistral Small 3.1 24B", + "id": "openai-o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.35, - "output": 0.56, - "cache_read": 0.015 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "mistralai/mistral-nemo", - "name": "Mistral: Mistral Nemo", - "display_name": "Mistral: Mistral Nemo", + "id": "anthropic-claude-3.5-sonnet", + "name": "Claude 3.5 Sonnet", + "display_name": "Claude 3.5 Sonnet", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + 
"output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-01", - "last_updated": "2024-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-06-20", + "last_updated": "2024-10-22", "cost": { - "input": 0.02, - "output": 0.04 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral: Mistral Large 3 2512", - "display_name": "Mistral: Mistral Large 3 2512", + "id": "openai-gpt-5-mini", + "name": "GPT-5 mini", + "display_name": "GPT-5 mini", "modalities": { "input": [ "text", @@ -42203,31 +45038,33 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2024-11-01", - "last_updated": "2025-12-16", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "mistralai/ministral-3b-2512", - "name": "Mistral: Ministral 3 3B 2512", - "display_name": "Mistral: Ministral 3 3B 2512", + "id": "nvidia-nemotron-3-super-120b", + "name": "Nemotron-3-Super-120B", + "display_name": "Nemotron-3-Super-120B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -42235,28 +45072,30 @@ ] }, "limit": { - "context": 131072, + "context": 256000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": 
"2026-03-15", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-04-16", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.3, + "output": 0.65 }, "type": "chat" }, { - "id": "mistralai/mistral-saba", - "name": "Mistral: Saba", - "display_name": "Mistral: Saba", + "id": "glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -42266,28 +45105,39 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 202752, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-02-17", - "last_updated": "2026-03-15", + "release_date": "2026-02-11", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 0.6 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3", - "name": "Mistral: Mistral Medium 3", - "display_name": "Mistral: Mistral Medium 3", + "id": "openai-gpt-5.2-pro", + "name": "GPT-5.2 pro", + "display_name": "GPT-5.2 pro", "modalities": { "input": [ "text", @@ -42298,72 +45148,79 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.4, - "output": 2 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "mistralai/voxtral-small-24b-2507", - "name": "Mistral: Voxtral Small 24B 2507", - 
"display_name": "Mistral: Voxtral Small 24B 2507", + "id": "anthropic-claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 6400 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.1, - "output": 0.3 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mistralai/mistral-medium-3-5", - "name": "Mistral: Mistral Medium 3.5", - "display_name": "Mistral: Mistral Medium 3.5", + "id": "nemotron-3-nano-omni", + "name": "Nemotron Nano 3 Omni", + "display_name": "Nemotron Nano 3 Omni", "modalities": { "input": [ + "text", "image", - "text" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -42372,50 +45229,19 @@ "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-07", - "cost": { - "input": 1.5, - "output": 7.5 - }, - "type": "chat" - }, - { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 65536, - "output": 13108 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "release_date": "2026-04-28", + 
"last_updated": "2026-04-30", "cost": { - "input": 2, - "output": 6 + "input": 0.5, + "output": 0.9 }, "type": "chat" }, { - "id": "mistralai/devstral-small", - "name": "Mistral: Devstral Small 1.1", - "display_name": "Mistral: Devstral Small 1.1", + "id": "alibaba-qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ "text" @@ -42425,249 +45251,214 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 131000, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-05-07", - "last_updated": "2025-07-10", + "release_date": "2025-04-30", + "last_updated": "2026-04-16", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.25, + "output": 0.55 }, "type": "chat" }, { - "id": "mistralai/devstral-2512", - "name": "Mistral: Devstral 2 2512", - "display_name": "Mistral: Devstral 2 2512", + "id": "nemotron-nano-12b-v2-vl", + "name": "Nemotron Nano 12B v2 VL", + "display_name": "Nemotron Nano 12B v2 VL", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-12", - "last_updated": "2026-03-15", + "knowledge": "2024-10", + "release_date": "2025-12-01", + "last_updated": "2026-04-30", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.025 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "mistralai/mistral-small-3.2-24b-instruct", - "name": "Mistral: Mistral Small 3.2 24B", - "display_name": "Mistral: Mistral Small 3.2 24B", + "id": "openai-gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex 
Max", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.06, - "output": 0.18, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mistralai/codestral-2508", - "name": "Mistral: Codestral 2508", - "display_name": "Mistral: Codestral 2508", + "id": "fal-ai/fast-sdxl", + "name": "Fast SDXL", + "display_name": "Fast SDXL", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 51200 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", - "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "mistralai/pixtral-large-2411", - "name": "Mistral: Pixtral Large 2411", - "display_name": "Mistral: Pixtral Large 2411", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2024-11-19", - "last_updated": "2026-03-15", - "cost": { - "input": 2, - "output": 6 - }, + "release_date": "2023-07-26", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": 
"sao10k/l3.1-euryale-70b", - "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", - "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "id": "fal-ai/elevenlabs/tts/multilingual-v2", + "name": "ElevenLabs Multilingual TTS v2", + "display_name": "ElevenLabs Multilingual TTS v2", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-08-28", - "last_updated": "2026-03-15", - "cost": { - "input": 0.85, - "output": 0.85 - }, + "open_weights": false, + "release_date": "2023-08-22", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "sao10k/l3-lunaris-8b", - "name": "Sao10K: Llama 3 8B Lunaris", - "display_name": "Sao10K: Llama 3 8B Lunaris", + "id": "fal-ai/flux/schnell", + "name": "FLUX.1 [schnell]", + "display_name": "FLUX.1 [schnell]", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-08-13", - "last_updated": "2026-03-15", - "cost": { - "input": 0.04, - "output": 0.05 - }, + "release_date": "2024-08-01", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "sao10k/l3.3-euryale-70b", - "name": "Sao10K: Llama 3.3 Euryale 70B", - "display_name": "Sao10K: Llama 3.3 Euryale 70B", + "id": "fal-ai/stable-audio-25/text-to-audio", + "name": "Stable Audio 2.5 (Text-to-Audio)", + "display_name": "Stable Audio 2.5 (Text-to-Audio)", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": 
false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-18", - "last_updated": "2026-03-15", - "cost": { - "input": 0.65, - "output": 0.75 - }, + "open_weights": false, + "release_date": "2025-10-08", + "last_updated": "2026-04-16", "type": "chat" - }, + } + ] + }, + "venice": { + "id": "venice", + "name": "Venice AI", + "display_name": "Venice AI", + "doc": "https://docs.venice.ai", + "models": [ { - "id": "sao10k/l3-euryale-70b", - "name": "Sao10k: Llama 3 Euryale 70B v2.1", - "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", + "id": "z-ai-glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ "text" @@ -42677,59 +45468,79 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-06-18", - "last_updated": "2026-03-15", + "release_date": "2026-03-15", + "last_updated": "2026-06-11", "cost": { - "input": 1.48, - "output": 1.48 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "sao10k/l3.1-70b-hanami-x1", - "name": "Sao10K: Llama 3.1 70B Hanami x1", - "display_name": "Sao10K: Llama 3.1 70B Hanami x1", + "id": "grok-4-20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 2000000, + "output": 128000 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-08", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-12", + 
"last_updated": "2026-06-11", "cost": { - "input": 3, - "output": 3 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + } }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek: R1 0528", - "display_name": "DeepSeek: R1 0528", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -42739,8 +45550,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -42761,30 +45572,33 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2026-03-15", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-06-11", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.2 + "input": 0.17, + "output": 0.35, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek: DeepSeek V3.2", - "display_name": "DeepSeek: DeepSeek V3.2", + "id": "google-gemma-4-31b-it", + "name": "Google Gemma 4 31B Instruct", + "display_name": "Google Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -42792,37 +45606,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "release_date": "2026-04-03", + "last_updated": "2026-06-11", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 
0.125 + "input": 0.12, + "output": 0.36, + "cache_read": 0.09 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek: R1", - "display_name": "DeepSeek: R1", + "id": "kimi-k2-6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -42841,20 +45651,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-01", + "release_date": "2026-04-20", + "last_updated": "2026-06-11", "cost": { - "input": 0.7, - "output": 2.5 + "input": 0.85, + "output": 4.655, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3.1", - "name": "DeepSeek: DeepSeek V3.1", - "display_name": "DeepSeek: DeepSeek V3.1", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen 3 235B A22B Instruct 2507", + "display_name": "Qwen 3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -42864,19 +45676,17 @@ ] }, "limit": { - "context": 32768, - "output": 7168 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-04-29", + "last_updated": "2026-06-11", "cost": { "input": 0.15, "output": 0.75 @@ -42884,9 +45694,9 @@ "type": "chat" }, { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "DeepSeek: DeepSeek V3 0324", - "display_name": "DeepSeek: DeepSeek V3 0324", + "id": "nvidia-nemotron-cascade-2-30b-a3b", + "name": "Nemotron Cascade 2 30B A3B", + "display_name": "Nemotron Cascade 2 30B A3B", "modalities": { "input": [ "text" @@ -42896,8 +45706,8 @@ ] }, "limit": { - "context": 163840, - "output": 
65536 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -42907,89 +45717,114 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2026-03-15", + "release_date": "2026-03-24", + "last_updated": "2026-06-11", "cost": { - "input": 0.2, - "output": 0.77, - "cache_read": 0.095 + "input": 0.14, + "output": 0.8 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-llama-70b", - "name": "DeepSeek: R1 Distill Llama 70B", - "display_name": "DeepSeek: R1 Distill Llama 70B", + "id": "claude-opus-4-7-fast", + "name": "Claude Opus 4.7 Fast", + "display_name": "Claude Opus 4.7 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-05-14", + "last_updated": "2026-06-11", "cost": { - "input": 0.7, - "output": 0.8, - "cache_read": 0.015 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek: DeepSeek V3", - "display_name": "DeepSeek: DeepSeek V3", + "id": "openai-gpt-55-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-06-11", "cost": { - "input": 0.32, - "output": 0.89, - "cache_read": 0.15 + "input": 37.5, + "output": 225 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-speciale", - "name": "DeepSeek: DeepSeek V3.2 Speciale", - "display_name": "DeepSeek: DeepSeek V3.2 Speciale", + "id": "llama-3.3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -42999,40 +45834,39 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2026-03-15", + "release_date": "2025-04-06", + 
"last_updated": "2026-06-11", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.135 + "input": 0.7, + "output": 2.8 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek: DeepSeek V3.1 Terminus", - "display_name": "DeepSeek: DeepSeek V3.1 Terminus", + "id": "qwen3-5-397b-a17b", + "name": "Qwen 3.5 397B", + "display_name": "Qwen 3.5 397B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, + "context": 128000, "output": 32768 }, "temperature": true, @@ -43041,97 +45875,83 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "release_date": "2026-02-16", + "last_updated": "2026-06-11", "cost": { - "input": 0.21, - "output": 0.79, - "cache_read": 0.13 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek: DeepSeek V4 Flash", - "display_name": "DeepSeek: DeepSeek V4 Flash", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 198000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 - }, - "type": "chat" - }, - { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek: DeepSeek V3.2 Exp", - "display_name": "DeepSeek: DeepSeek V3.2 Exp", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 163840, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-09-29", + "knowledge": "2025-03-31", + "release_date": "2025-12-06", + "last_updated": "2026-06-11", "cost": { - "input": 0.27, - "output": 0.41 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek: DeepSeek V4 Pro", - "display_name": "DeepSeek: DeepSeek V4 Pro", + "id": "zai-org-glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -43141,8 +45961,8 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 198000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -43162,55 +45982,59 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-06-11", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1-distill-qwen-32b", - "name": "DeepSeek: R1 Distill Qwen 32B", - "display_name": "DeepSeek: R1 Distill Qwen 32B", + "id": "qwen3-5-35b-a3b", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", 
"modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "release_date": "2026-02-25", + "last_updated": "2026-06-11", "cost": { - "input": 0.29, - "output": 0.29 + "input": 0.3125, + "output": 1.25, + "cache_read": 0.15625 }, "type": "chat" }, { - "id": "inception/mercury-2", - "name": "Inception: Mercury 2", - "display_name": "Inception: Mercury 2", + "id": "venice-uncensored-role-play", + "name": "Venice Role Play Uncensored", + "display_name": "Venice Role Play Uncensored", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -43218,90 +46042,81 @@ }, "limit": { "context": 128000, - "output": 50000 + "output": 4096 }, - "temperature": true, "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", - "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 - }, - "type": "chat" - }, - { - "id": "relace/relace-apply-3", - "name": "Relace: Relace Apply 3", - "display_name": "Relace: Relace Apply 3", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 128000 - }, - "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-20", + "last_updated": "2026-06-11", "cost": { - "input": 0.85, - "output": 1.25 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": 
"relace/relace-search", - "name": "Relace: Relace Search", - "display_name": "Relace: Relace Search", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus Uncensored", + "display_name": "Qwen 3.6 Plus Uncensored", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2026-04-06", + "last_updated": "2026-06-11", "cost": { - "input": 1, - "output": 3 + "input": 0.625, + "output": 3.75, + "cache_read": 0.0625, + "cache_write": 0.78, + "tiers": [ + { + "input": 2.5, + "output": 7.5, + "cache_read": 0.0625, + "cache_write": 0.78, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 7.5, + "cache_read": 0.0625, + "cache_write": 0.78 + } }, "type": "chat" }, { - "id": "thedrummer/rocinante-12b", - "name": "TheDrummer: Rocinante 12B", - "display_name": "TheDrummer: Rocinante 12B", + "id": "zai-org-glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ "text" @@ -43311,121 +46126,180 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-09-30", - "last_updated": "2026-03-15", + "knowledge": "2025-04", + "release_date": "2024-04-01", + "last_updated": 
"2026-06-11", "cost": { - "input": 0.17, - "output": 0.43 + "input": 0.85, + "output": 2.75, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "thedrummer/skyfall-36b-v2", - "name": "TheDrummer: Skyfall 36B V2", - "display_name": "TheDrummer: Skyfall 36B V2", + "id": "openai-gpt-4o-2024-11-20", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-11", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2026-02-28", + "last_updated": "2026-06-11", "cost": { - "input": 0.55, - "output": 0.8 + "input": 3.125, + "output": 12.5 }, "type": "chat" }, { - "id": "thedrummer/unslopnemo-12b", - "name": "TheDrummer: UnslopNemo 12B", - "display_name": "TheDrummer: UnslopNemo 12B", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 1000000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-09", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-18", + "last_updated": "2026-06-11", "cost": { - "input": 0.4, - "output": 0.4 + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, + "tiers": [ + { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 + 
} }, "type": "chat" }, { - "id": "thedrummer/cydonia-24b-v4.1", - "name": "TheDrummer: Cydonia 24B V4.1", - "display_name": "TheDrummer: Cydonia 24B V4.1", + "id": "qwen-3-7-plus", + "name": "Qwen 3.7 Plus", + "display_name": "Qwen 3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-27", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-11", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0.5, + "output": 2, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 1.5, + "output": 6, + "cache_read": 0.15, + "cache_write": 1.875, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 1.5, + "output": 6, + "cache_read": 0.15, + "cache_write": 1.875 + } }, "type": "chat" }, { - "id": "deepcogito/cogito-v2.1-671b", - "name": "Deep Cogito: Cogito v2.1 671B", - "display_name": "Deep Cogito: Cogito v2.1 671B", + "id": "minimax-m27", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -43435,60 +46309,30 @@ ] }, "limit": { - "context": 128000, + "context": 198000, "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-11-14", - "last_updated": "2026-03-15", - "cost": { - "input": 1.25, - "output": 1.25 - }, - "type": "chat" - }, - { - "id": "inflection/inflection-3-pi", - "name": "Inflection: Inflection 3 Pi", - "display_name": "Inflection: Inflection 
3 Pi", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8000, - "output": 1024 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", + "release_date": "2026-03-18", + "last_updated": "2026-06-11", "cost": { - "input": 2.5, - "output": 10 + "input": 0.375, + "output": 1.5, + "cache_read": 0.06875 }, "type": "chat" }, { - "id": "inflection/inflection-3-productivity", - "name": "Inflection: Inflection 3 Productivity", - "display_name": "Inflection: Inflection 3 Productivity", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -43498,66 +46342,44 @@ ] }, "limit": { - "context": 8000, - "output": 1024 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2026-03-15", - "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" - }, - { - "id": "perceptron/perceptron-mk1", - "name": "Perceptron: Perceptron Mk1", - "display_name": "Perceptron: Perceptron Mk1", - "modalities": { - "input": [ - "image", - "text", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": 
"2026-04-24", + "last_updated": "2026-06-11", "cost": { - "input": 0.15, - "output": 1.5 + "input": 1.73, + "output": 3.796, + "cache_read": 0.33 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen 3 235B A22B Thinking 2507", + "display_name": "Qwen 3 235B A22B Thinking 2507", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -43565,64 +46387,51 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2026-06-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Anthropic: Claude Sonnet 4.6", - "display_name": "Anthropic: Claude Sonnet 4.6", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 198000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -43634,18 +46443,11 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", + "mode": "budget", "budget": { "min": 1024, "unit": "tokens" }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -43653,94 +46455,66 @@ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-15", + "knowledge": "2025-07-31", + "release_date": "2025-01-15", + "last_updated": "2026-06-11", "cost": { - "input": 3, - "output": 15 + "input": 3.75, + "output": 18.75, + "cache_read": 0.375, + "cache_write": 4.69 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "openai-gpt-4o-mini-2024-07-18", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2026-02-28", + "last_updated": "2026-06-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1875, + "output": 0.75, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Anthropic: Claude Opus 4.7", - "display_name": "Anthropic: Claude Opus 4.7", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -43784,20 +46558,21 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2026-01-31", "release_date": "2026-04-16", - "last_updated": "2026-05-01", + "last_updated": "2026-06-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "openai-gpt-53-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -43808,30 +46583,31 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-06-11", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - 
"name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "openai-gpt-54", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", @@ -43842,151 +46618,102 @@ ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 131072 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-06-11", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 3.13, + "output": 18.8, + "cache_read": 0.313 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6-fast", - "name": "Anthropic: Claude Opus 4.6 (Fast)", - "display_name": "Anthropic: Claude Opus 4.6 (Fast)", + "id": "google-gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 198000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-07", - "last_updated": "2026-04-11", + "open_weights": true, + "release_date": "2025-11-04", + "last_updated": "2026-06-11", "cost": { - "input": 30, - "output": 150, - "cache_read": 3, - "cache_write": 37.5 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "minimax-m3", + "name": "MiniMax M3", + "display_name": "MiniMax M3", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 500000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2026-03-15", + "release_date": "2026-06-01", + "last_updated": "2026-06-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Anthropic: Claude Opus 4.6", - "display_name": "Anthropic: Claude Opus 4.6", + "id": "claude-opus-4-8-fast", + "name": "Claude Opus 4.8 Fast", + "display_name": "Claude Opus 4.8 Fast", "modalities": { "input": [ "text", @@ -44000,7 +46727,7 @@ "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -44010,107 +46737,77 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "high", "effort_options": [ "low", "medium", "high", + "xhigh", "max" ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-05-28", + "last_updated": "2026-06-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 12, + "output": 60, + "cache_read": 1.2, + "cache_write": 15 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Anthropic: Claude Haiku 4.5", - "display_name": "Anthropic: Claude Haiku 4.5", + "id": "gemma-4-uncensored", + "name": "Gemma 4 Uncensored", + "display_name": "Gemma 4 Uncensored", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "release_date": "2026-04-13", + "last_updated": "2026-06-11", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.1625, + "output": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7-fast", - "name": "Anthropic: Claude Opus 4.7 (Fast)", - "display_name": "Anthropic: Claude Opus 4.7 (Fast)", + "id": "qwen3-next-80b", + "name": "Qwen 3 Next 80b", + "display_name": "Qwen 3 Next 80b", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -44118,129 +46815,75 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-12", - "last_updated": "2026-05-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-29", + "last_updated": "2026-06-11", "cost": { - "input": 30, - "output": 150, - "cache_read": 3, - "cache_write": 37.5 + "input": 0.35, + "output": 1.9 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "display_name": "Mistral Small 4", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-06-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.1875, + "output": 0.75 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -44250,54 +46893,55 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "release_date": "2026-05-28", + "last_updated": "2026-06-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-omni", - "name": "Xiaomi: MiMo-V2-Omni", - "display_name": "Xiaomi: MiMo-V2-Omni", + "id": "zai-org-glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -44305,33 +46949,34 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-29", + "last_updated": "2026-06-11", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "Xiaomi: MiMo-V2-Pro", - "display_name": "Xiaomi: MiMo-V2-Pro", + "id": "google-gemma-4-26b-a4b-it", + "name": "Google Gemma 4 26B A4B Instruct", + "display_name": "Google Gemma 4 26B A4B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -44339,102 +46984,69 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": true, + "release_date": 
"2026-04-02", + "last_updated": "2026-06-11", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.1625, + "output": 0.5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "Xiaomi: MiMo-V2.5", - "display_name": "Xiaomi: MiMo-V2.5", + "id": "grok-4-20", + "name": "Grok 4.20", + "display_name": "Grok 4.20", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 2000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2026-03-12", + "last_updated": "2026-06-11", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, + "input": 1.42, + "output": 2.83, + "cache_read": 0.23, "tiers": [ { - "input": 0.8, - "output": 4, - "cache_read": 0.16, + "input": 2.83, + "output": 5.67, + "cache_read": 0.45, "tier": { "type": "context", - "size": 256000 + "size": 200000 } } ], "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 + "input": 2.83, + "output": 5.67, + "cache_read": 0.45 } }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi: MiMo-V2-Flash", - "display_name": "Xiaomi: MiMo-V2-Flash", + "id": "hermes-3-llama-3.1-405b", + "name": "Hermes 3 Llama 3.1 405b", + "display_name": "Hermes 3 Llama 3.1 405b", "modalities": { "input": [ "text" @@ -44444,31 
+47056,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2025-09-25", + "last_updated": "2026-06-11", "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 + "input": 1.1, + "output": 3 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "Xiaomi: MiMo V2.5 Pro", - "display_name": "Xiaomi: MiMo V2.5 Pro", + "id": "aion-labs-aion-2-0", + "name": "Aion 2.0", + "display_name": "Aion 2.0", "modalities": { "input": [ "text" @@ -44478,61 +47086,33 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2026-03-24", + "last_updated": "2026-06-11", "cost": { "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "output": 2, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "ai21/jamba-large-1.7", - "name": "AI21: Jamba Large 1.7", - "display_name": "AI21: Jamba Large 1.7", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3 VL 235B", + "display_name": "Qwen3 VL 235B", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -44540,31 +47120,42 @@ }, "limit": { "context": 256000, - "output": 4096 + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-09", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-01-16", + "last_updated": "2026-06-11", "cost": { - "input": 2, - "output": 8 + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-02-15", - "name": "Qwen: Qwen3.5 Plus 2026-02-15", - "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", + "id": "xiaomi-mimo-v2-5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "image", "text", + "image", + "audio", "video" ], "output": [ @@ -44581,120 +47172,105 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-06-11", + "last_updated": "2026-06-11", "cost": { - "input": 0.26, - "output": 1.56 + "input": 0.175, + "output": 0.35, + "cache_read": 0.0625 }, "type": "chat" }, { - "id": "qwen/qwen-plus-2025-07-28", - "name": "Qwen: Qwen Plus 0728", - "display_name": "Qwen: Qwen Plus 0728", + "id": "venice-uncensored-1-2", + "name": "Venice Uncensored 1.2", + "display_name": "Venice Uncensored 1.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 
1000000, - "output": 32768 + "context": 128000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "release_date": "2026-04-01", + "last_updated": "2026-06-11", "cost": { - "input": 0.26, - "output": 0.78 + "input": 0.2, + "output": 0.9 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-instruct-2507", - "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", + "id": "gemini-3-5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-22", + "last_updated": "2026-06-11", "cost": { - "input": 0.09, - "output": 0.3, - "cache_read": 0.04 + "input": 1.55, + "output": 9.45, + "cache_read": 0.155, + "cache_write": 0.086 }, "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen: Qwen3.5-122B-A10B", - "display_name": "Qwen: Qwen3.5-122B-A10B", + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + 
"output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -44703,28 +47279,46 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-06-10", + "last_updated": "2026-06-11", "cost": { - "input": 0.26, - "output": 2.08 + "input": 12, + "output": 60, + "cache_read": 1.2, + "cache_write": 15 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", + "id": "openai-gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" @@ -44734,31 +47328,30 @@ ] }, "limit": { - "context": 131072, - "output": 52429 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "release_date": "2025-11-06", + "last_updated": "2026-06-11", "cost": { - "input": 0.09, - "output": 1.1 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": 
"qwen/qwen2.5-vl-72b-instruct", - "name": "Qwen: Qwen2.5 VL 72B Instruct", - "display_name": "Qwen: Qwen2.5 VL 72B Instruct", + "id": "nvidia-nemotron-3-nano-30b-a3b", + "name": "NVIDIA Nemotron 3 Nano 30B", + "display_name": "NVIDIA Nemotron 3 Nano 30B", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -44766,29 +47359,28 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-02-01", - "last_updated": "2026-03-15", + "release_date": "2026-01-27", + "last_updated": "2026-06-11", "cost": { - "input": 0.8, - "output": 0.8, - "cache_read": 0.075 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -44799,72 +47391,60 @@ ] }, "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", - "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-32b", - "name": "Qwen: Qwen3 32B", - "display_name": "Qwen: Qwen3 32B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 40960, - "output": 40960 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + 
"unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-06-11", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 6, + "output": 30, + "cache_read": 0.6, + "cache_write": 7.5 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-30b-a3b-instruct", - "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "id": "mistral-small-3-2-24b-instruct", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", "modalities": { "input": [ "text" @@ -44874,137 +47454,162 @@ ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 256000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "release_date": "2026-01-15", + "last_updated": "2026-06-11", "cost": { - "input": 0.07, - "output": 0.27 + "input": 0.09375, + "output": 0.25 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-30b-a3b-thinking", - "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", + "id": "openai-gpt-54-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { 
- "context": 131072, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2025-10-11", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-06-11", "cost": { - "input": 0.13, - "output": 1.56 + "input": 37.5, + "output": 225, + "tiers": [ + { + "input": 75, + "output": 337.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 75, + "output": 337.5 + } }, "type": "chat" }, { - "id": "qwen/qwen-2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-06-11", "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0.015 + "input": 2.5, + "output": 15, + "cache_read": 0.5, + "cache_write": 0.5, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "cache_write": 0.5, + "tier": { + "type": "context", + "size": 
200000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "cache_write": 0.5 + } }, "type": "chat" }, { - "id": "qwen/qwen3-vl-235b-a22b-instruct", - "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", + "id": "qwen3-coder-480b-a35b-instruct-turbo", + "name": "Qwen 3 Coder 480B Turbo", + "display_name": "Qwen 3 Coder 480B Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-09-23", - "last_updated": "2026-01-10", + "release_date": "2026-01-27", + "last_updated": "2026-06-11", "cost": { - "input": 0.2, - "output": 0.88, - "cache_read": 0.11 + "input": 0.35, + "output": 1.5, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "qwen/qwen3.6-27b", - "name": "Qwen: Qwen3.6 27B", - "display_name": "Qwen: Qwen3.6 27B", + "id": "qwen3-6-27b", + "name": "Qwen 3.6 27B", + "display_name": "Qwen 3.6 27B", "modalities": { "input": [ "text", @@ -45025,21 +47630,10 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "release_date": "2026-04-24", + "last_updated": "2026-06-11", "cost": { "input": 0.325, "output": 3.25 @@ -45047,58 +47641,48 @@ "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b", - "name": "Qwen: Qwen3 235B A22B", - "display_name": "Qwen: Qwen3 235B A22B", + "id": "openai-gpt-52-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" 
], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-01-15", + "last_updated": "2026-06-11", "cost": { - "input": 0.455, - "output": 1.82, - "cache_read": 0.15 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus-20260420", - "name": "Qwen: Qwen3.5 Plus 2026-04-20", - "display_name": "Qwen: Qwen3.5 Plus 2026-04-20", + "id": "claude-opus-4-6-fast", + "name": "Claude Opus 4.6 Fast", + "display_name": "Claude Opus 4.6 Fast", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -45106,39 +47690,59 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2025-05-31", + "release_date": "2026-04-08", + "last_updated": "2026-06-11", "cost": { - "input": 0.4, - "output": 2.4 + "input": 36, + "output": 180, + "cache_read": 3.6, + "cache_write": 45 }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen: Qwen3 Max", - "display_name": "Qwen: Qwen3 Max", + "id": "qwen-3-7-max", + "name": "Qwen 3.7 Max", + "display_name": "Qwen 3.7 Max", "modalities": { "input": [ "text" @@ -45148,40 +47752,31 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2026-03-15", + "release_date": "2026-05-22", + "last_updated": "2026-06-11", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 2.7, + "output": 8.05, + "cache_read": 0.27, + "cache_write": 3.35 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-plus", - "name": "Qwen: Qwen3 Coder Plus", - "display_name": "Qwen: Qwen3 Coder Plus", + "id": "olafangensan-glm-4.7-flash-heretic", + "name": "GLM 4.7 Flash Heretic", + "display_name": "GLM 4.7 Flash Heretic", "modalities": { "input": [ "text" @@ -45191,105 +47786,113 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 24000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-15", + "release_date": "2026-02-04", + "last_updated": 
"2026-06-11", "cost": { - "input": 0.65, - "output": 3.25, - "cache_read": 0.2 + "input": 0.14, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "display_name": "Qwen: Qwen3 14B", + "id": "openai-gpt-54-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-27", + "last_updated": "2026-06-11", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.025 + "input": 0.9375, + "output": 5.625, + "cache_read": 0.09375 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-next", - "name": "Qwen: Qwen3 Coder Next", - "display_name": "Qwen: Qwen3 Coder Next", + "id": "grok-build-0-1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 256000, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-21", + "last_updated": "2026-06-11", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.035 + "input": 1, + "output": 2, + 
"cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 4, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 4, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-thinking-2507", - "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", + "id": "zai-org-glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -45299,8 +47902,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 198000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -45321,72 +47924,98 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2026-03-15", - "cost": { - "input": 0.11, - "output": 0.6 + "knowledge": "2025-04", + "release_date": "2025-12-24", + "last_updated": "2026-06-11", + "cost": { + "input": 0.55, + "output": 2.65, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "qwen/qwen3-8b", - "name": "Qwen: Qwen3 8B", - "display_name": "Qwen: Qwen3 8B", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility 
path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-06-11", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.05 + "input": 3.6, + "output": 18, + "cache_read": 0.36, + "cache_write": 4.5 }, "type": "chat" }, { - "id": "qwen/qwen3.7-max", - "name": "Qwen: Qwen3.7 Max", - "display_name": "Qwen: Qwen3.7 Max", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 65536 }, "temperature": true, @@ -45397,57 +48026,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-05-27", - "cost": { - "input": 1.625, - "output": 4.875, - "cache_read": 0.1625, - "cache_write": 2.03125 - }, - "type": "chat" - }, - { - "id": "qwen/qwen3-235b-a22b-2507", - "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 52429 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - 
"release_date": "2025-04", - "last_updated": "2026-01", + "knowledge": "2025-01", + "release_date": "2025-12-19", + "last_updated": "2026-06-11", "cost": { - "input": 0.071, - "output": 0.1 + "input": 0.7, + "output": 3.75, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b", - "name": "Qwen: Qwen3 30B A3B", - "display_name": "Qwen: Qwen3 30B A3B", + "id": "arcee-trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ "text" @@ -45457,10 +48069,9 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -45479,23 +48090,23 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-03-15", + "release_date": "2026-04-02", + "last_updated": "2026-06-11", "cost": { - "input": 0.08, - "output": 0.28, - "cache_read": 0.03 + "input": 0.3125, + "output": 1.125, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen/qwen3.6-plus", - "name": "Qwen: Qwen3.6 Plus", - "display_name": "Qwen: Qwen3.6 Plus", + "id": "openai-gpt-55", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -45503,46 +48114,50 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 131072 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-04-11", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-06-11", "cost": { - "input": 0.325, - "output": 1.95, - 
"cache_read": 0.0325, - "cache_write": 0.40625 + "input": 6.25, + "output": 37.5, + "cache_read": 0.625, + "tiers": [ + { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 12.5, + "output": 56.25, + "cache_read": 1.25 + } }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen: Qwen3.5-9B", - "display_name": "Qwen: Qwen3.5-9B", + "id": "qwen3-5-9b", + "name": "Qwen 3.5 9B", + "display_name": "Qwen 3.5 9B", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" @@ -45552,40 +48167,27 @@ "context": 256000, "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": true, - "release_date": "2026-03-10", - "last_updated": "2026-03-15", + "release_date": "2026-03-05", + "last_updated": "2026-06-11", "cost": { - "input": 0.05, + "input": 0.1, "output": 0.15 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-instruct", - "name": "Qwen: Qwen3 VL 8B Instruct", - "display_name": "Qwen: Qwen3 VL 8B Instruct", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -45593,41 +48195,40 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 50000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-20", + "last_updated": "2026-06-11", "cost": { - "input": 0.08, - "output": 0.5 + "input": 0.3125, 
+ "output": 0.9375, + "cache_read": 0.03125 }, "type": "chat" }, { - "id": "qwen/qwen3.5-flash-02-23", - "name": "Qwen: Qwen3.5-Flash", - "display_name": "Qwen: Qwen3.5-Flash", + "id": "zai-org-glm-5-1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 24000 }, "temperature": true, "tool_call": true, @@ -45646,33 +48247,35 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "release_date": "2026-04-07", + "last_updated": "2026-06-11", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.75, + "output": 5.5, + "cache_read": 0.325 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-thinking", - "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", + "id": "kimi-k2-5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 256000, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -45689,65 +48292,67 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-11", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2026-01-27", + "last_updated": "2026-06-11", "cost": { - "input": 0.0975, - "output": 0.78 + "input": 0.56, + "output": 3.5, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "qwen/qwen3-coder-flash", - "name": "Qwen: Qwen3 Coder Flash", - "display_name": "Qwen: Qwen3 Coder Flash", + "id": "z-ai-glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "release_date": "2026-04-01", + "last_updated": "2026-06-11", "cost": { - "input": 0.195, - "output": 0.975, - "cache_read": 0.06 + "input": 1.5, + "output": 5, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen: Qwen3.5-35B-A3B", - "display_name": "Qwen: Qwen3.5-35B-A3B", + "id": "nvidia-nemotron-3-ultra-550b-a55b", + "name": "NVIDIA Nemotron 3 Ultra", + "display_name": "NVIDIA Nemotron 3 Ultra", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -45755,123 +48360,92 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "release_date": "2026-06-04", + "last_updated": "2026-06-11", "cost": { - "input": 0.1625, - "output": 1.3 + "input": 0.625, + "output": 3.125, + "cache_read": 0.1875 }, "type": "chat" }, { - "id": "qwen/qwen3.6-flash", - "name": "Qwen: Qwen3.6 Flash", - "display_name": "Qwen: Qwen3.6 Flash", + "id": "openai-gpt-52", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 65536 }, - "temperature": true, + "temperature": 
false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-13", + "last_updated": "2026-06-11", "cost": { - "input": 0.25, - "output": 1.5, - "cache_write": 0.3125 + "input": 2.19, + "output": 17.5, + "cache_read": 0.219 }, "type": "chat" }, { - "id": "qwen/qwen3.6-35b-a3b", - "name": "Qwen: Qwen3.6 35B A3B", - "display_name": "Qwen: Qwen3.6 35B A3B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 160000, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-04", + "last_updated": "2026-06-11", "cost": { - "input": 0.1612, - "output": 0.96525, - "cache_read": 0.1612 + "input": 0.33, + "output": 0.48, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-thinking-2507", - "name": "Qwen: Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", + "id": "minimax-m25", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -45881,8 +48455,8 
@@ ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 198000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -45903,50 +48477,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", - "cost": { - "input": 0.051, - "output": 0.34 - }, - "type": "chat" - }, - { - "id": "qwen/qwen-plus-2025-07-28:thinking", - "name": "Qwen: Qwen Plus 0728 (thinking)", - "display_name": "Qwen: Qwen Plus 0728 (thinking)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-09", - "last_updated": "2026-03-15", + "release_date": "2026-02-12", + "last_updated": "2026-06-11", "cost": { - "input": 0.26, - "output": 0.78 + "input": 0.34, + "output": 1.19, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen: Qwen3 Coder 480B A35B", - "display_name": "Qwen: Qwen3 Coder 480B A35B", + "id": "llama-3.2-3b", + "name": "Llama 3.2 3B", + "display_name": "Llama 3.2 3B", "modalities": { "input": [ "text" @@ -45956,29 +48499,27 @@ ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 128000, + "output": 4096 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2024-10-03", + "last_updated": "2026-06-11", "cost": { - "input": 0.22, - "output": 1, - "cache_read": 0.022 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen/qwen3.6-max-preview", - "name": "Qwen: Qwen3.6 Max Preview", - "display_name": "Qwen: Qwen3.6 Max Preview", + "id": "tencent-hy3-preview", + "name": "Hy3 Preview", + "display_name": "Hy3 Preview", "modalities": { "input": [ 
"text" @@ -45988,8 +48529,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -45997,45 +48538,41 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2026-06-08", + "last_updated": "2026-06-11", "cost": { - "input": 1.04, - "output": 6.24, - "cache_write": 1.3 + "input": 0.063, + "output": 0.21, + "cache_read": 0.021 }, "type": "chat" - }, + } + ] + }, + "lmstudio": { + "id": "lmstudio", + "name": "LMStudio", + "display_name": "LMStudio", + "api": "http://127.0.0.1:1234/v1", + "doc": "https://lmstudio.ai/models", + "models": [ { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen: Qwen3.5 397B A17B", - "display_name": "Qwen: Qwen3.5 397B A17B", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -46045,29 +48582,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.39, - "output": 2.34 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "Qwen: Qwen2.5 7B 
Instruct", - "display_name": "Qwen: Qwen2.5 7B Instruct", + "id": "qwen/qwen3-30b-a3b-2507", + "name": "Qwen3 30B A3B 2507", + "display_name": "Qwen3 30B A3B 2507", "modalities": { "input": [ "text" @@ -46077,8 +48608,8 @@ ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -46087,18 +48618,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2024-09", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.04, - "output": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-max-thinking", - "name": "Qwen: Qwen3 Max Thinking", - "display_name": "Qwen: Qwen3 Max Thinking", + "id": "qwen/qwen3-coder-30b", + "name": "Qwen3 Coder 30B", + "display_name": "Qwen3 Coder 30B", "modalities": { "input": [ "text" @@ -46109,52 +48641,48 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.78, - "output": 3.9 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "poolside": { + "id": "poolside", + "name": "Poolside", + "display_name": "Poolside", + "api": "https://inference.poolside.ai/v1", + "doc": "https://platform.poolside.ai", + "models": [ { - "id": "qwen/qwen3.5-27b", - "name": "Qwen: Qwen3.5-27B", - "display_name": "Qwen: Qwen3.5-27B", + "id": "poolside/laguna-xs.2", + "name": "Laguna 
XS.2", + "display_name": "Laguna XS.2", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131040, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -46173,23 +48701,24 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 0.195, - "output": 1.56 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-vl-8b-thinking", - "name": "Qwen: Qwen3 VL 8B Thinking", - "display_name": "Qwen: Qwen3 VL 8B Thinking", + "id": "poolside/laguna-m.1", + "name": "Laguna M.1", + "display_name": "Laguna M.1", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -46197,8 +48726,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 131040, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -46217,34 +48746,45 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 0.117, - "output": 1.365 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "openai": { + "id": "openai", + "name": "OpenAI", + "display_name": "OpenAI", + "doc": "https://platform.openai.com/docs/models", + "models": [ { - "id": "qwen/qwen3-vl-235b-a22b-thinking", - "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, + 
"temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -46253,28 +48793,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-24", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.26, - "output": 2.6 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -46284,28 +48829,29 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-09", - "last_updated": "2026-01-10", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.12, - "output": 0.39 + "input": 0.13, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen/qwen3-vl-32b-instruct", - "name": "Qwen: Qwen3 VL 32B Instruct", - "display_name": "Qwen: Qwen3 VL 32B Instruct", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -46316,71 +48862,106 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - 
"temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.104, - "output": 0.416 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "qwen/qwen-plus", - "name": "Qwen: Qwen-Plus", - "display_name": "Qwen: Qwen-Plus", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 1.2, - "cache_read": 0.08 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, 
"type": "chat" }, { - "id": "liquid/lfm-2-24b-a2b", - "name": "LiquidAI: LFM2-24B-A2B", - "display_name": "LiquidAI: LFM2-24B-A2B", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -46390,8 +48971,8 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -46399,53 +48980,75 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.03, - "output": 0.12 + "input": 0.5, + "output": 1.5, + "cache_read": 0 }, "type": "chat" }, { - "id": "essentialai/rnj-1-instruct", - "name": "EssentialAI: Rnj 1 Instruct", - "display_name": "EssentialAI: Rnj 1 Instruct", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-05", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.15, - "output": 0.15 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Cohere: Command R+ 
(08-2024)", - "display_name": "Cohere: Command R+ (08-2024)", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -46453,27 +49056,29 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { "input": 2.5, - "output": 10 + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "cohere/command-r-08-2024", - "name": "Cohere: Command R (08-2024)", - "display_name": "Cohere: Command R (08-2024)", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -46483,94 +49088,82 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "attachment": true, + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.15, - "output": 0.6 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "cohere/command-a", - "name": "Cohere: Command A", - "display_name": "Cohere: Command A", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - 
"open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2025-03-13", - "cost": { - "input": 2.5, - "output": 10 + "supported": true, + "default": true }, - "type": "chat" - }, - { - "id": "cohere/command-r7b-12-2024", - "name": "Cohere: Command R7B (12-2024)", - "display_name": "Cohere: Command R7B (12-2024)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "openrouter/free", - "name": "Free Models Router", - "display_name": "Free Models Router", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -46578,62 +49171,76 @@ }, "limit": { "context": 200000, - "output": 32768 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-02-01", - "last_updated": "2026-03-15", + "knowledge": "2024-05", + "release_date": "2025-06-10", 
+ "last_updated": "2025-06-10", "cost": { - "input": 0, - "output": 0 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "openrouter/pareto-code", - "name": "Pareto Code Router", - "display_name": "Pareto Code Router", + "id": "chatgpt-image-latest", + "name": "chatgpt-image-latest", + "display_name": "chatgpt-image-latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 200000, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", - "cost": { - "input": 0, - "output": 0 - }, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "openrouter/bodybuilder", - "name": "Body Builder (beta)", - "display_name": "Body Builder (beta)", + "id": "gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -46641,153 +49248,191 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "openrouter/owl-alpha", - "name": "Owl Alpha", - "display_name": "Owl Alpha", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 262144 + "context": 400000, 
+ "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-04-30", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openrouter/auto", - "name": "Auto Router", - "display_name": "Auto Router", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ - "image", "text" ] }, "limit": { - "context": 2000000, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "MoonshotAI: Kimi K2 Thinking", - "display_name": "MoonshotAI: Kimi K2 Thinking", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 
131072, - "output": 65535 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-11-06", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.47, - "output": 2, - "cache_read": 0.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "MoonshotAI: Kimi K2.6", - "display_name": "MoonshotAI: Kimi K2.6", + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 128000, + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -46795,162 +49440,131 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-05-12", - 
"cost": { - "input": 0.75, - "output": 3.5, - "cache_read": 0.375 - }, - "type": "chat" - }, - { - "id": "moonshotai/kimi-k2-0905", - "name": "MoonshotAI: Kimi K2 0905", - "display_name": "MoonshotAI: Kimi K2 0905", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 26215 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.15 - }, - "type": "chat" - }, - { - "id": "moonshotai/kimi-k2", - "name": "MoonshotAI: Kimi K2 0711", - "display_name": "MoonshotAI: Kimi K2 0711", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - "output": 26215 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.55, - "output": 2.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "MoonshotAI: Kimi K2.5", - "display_name": "MoonshotAI: Kimi K2.5", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.45, - "output": 2.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-70b-instruct", - "name": "Meta: Llama 3.1 70B Instruct", - "display_name": "Meta: Llama 3.1 70B Instruct", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.4, - "output": 0.4 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "meta-llama/llama-4-maverick", - "name": "Meta: Llama 4 Maverick", - "display_name": "Meta: Llama 4 Maverick", + "id": "gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ "text", @@ -46961,7 +49575,7 @@ ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 16384 }, "temperature": true, @@ -46970,22 +49584,23 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": 
"2025-04-05", - "last_updated": "2025-12-24", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "meta-llama/llama-guard-4-12b", - "name": "Meta: Llama Guard 4 12B", - "display_name": "Meta: Llama Guard 4 12B", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -46993,28 +49608,29 @@ ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 8192, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2022-12", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta-llama/llama-3.2-3b-instruct", - "name": "Meta: Llama 3.2 3B Instruct", - "display_name": "Meta: Llama 3.2 3B Instruct", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -47024,28 +49640,45 @@ ] }, "limit": { - "context": 80000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - 
"last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.051, - "output": 0.34 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout", - "name": "Meta: Llama 4 Scout", - "display_name": "Meta: Llama 4 Scout", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -47056,60 +49689,110 @@ ] }, "limit": { - "context": 327680, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.08, - "output": 0.3 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-11b-vision-instruct", - "name": "Meta: Llama 3.2 11B Vision Instruct", - "display_name": "Meta: Llama 3.2 11B Vision Instruct", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.049, - "output": 0.049 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "meta-llama/llama-3.2-1b-instruct", - "name": "Meta: Llama 3.2 1B Instruct", - "display_name": "Meta: Llama 3.2 1B Instruct", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -47119,345 +49802,473 @@ ] }, "limit": { - "context": 60000, - "output": 12000 + "context": 8191, + "output": 1536 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2024-01", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.027, - "output": 0.2 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "meta-llama/llama-3-70b-instruct", - "name": "Meta: Llama 3 70B Instruct", - "display_name": "Meta: Llama 3 70B Instruct", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": 
false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "meta-llama/llama-3-8b-instruct", - "name": "Meta: Llama 3 8B Instruct", - "display_name": "Meta: Llama 3 8B Instruct", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2025-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.03, - "output": 0.04 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta-llama/llama-3.1-8b-instruct", - "name": "Meta: Llama 3.1 8B Instruct", - "display_name": "Meta: Llama 3.1 8B Instruct", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], 
"output": [ "text" ] }, "limit": { - "context": 16384, + "context": 128000, "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.02, - "output": 0.05 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "meta-llama/llama-3.3-70b-instruct", - "name": "Meta: Llama 3.3 70B Instruct", - "display_name": "Meta: Llama 3.3 70B Instruct", + "id": "o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2026-02-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 0.1, - "output": 0.32 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta-llama/llama-guard-3-8b", - "name": "Llama Guard 3 8B", - "display_name": "Llama Guard 3 8B", + "id": "gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", "modalities": { "input": [ - "text" + 
"text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2026-02-04", - "cost": { - "input": 0.02, - "output": 0.06 - }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "type": "imageGeneration" }, { - "id": "kilo-auto/balanced", - "name": "Kilo Auto Balanced", - "display_name": "Kilo Auto Balanced", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.6, - "output": 3 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "kilo-auto/frontier", - "name": "Kilo Auto Frontier", - "display_name": "Kilo Auto Frontier", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - 
"last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 5, - "output": 25 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "kilo-auto/small", - "name": "Kilo Auto Small", - "display_name": "Kilo Auto Small", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.05, - "output": 0.4 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "kilo-auto/free", - "name": "Kilo Auto Free", - "display_name": "Kilo Auto Free", + "id": "o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-15", 
- "last_updated": "2026-03-15", + "knowledge": "2023-09", + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0, - "output": 0 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Perplexity: Sonar", - "display_name": "Perplexity: Sonar", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127072, - "output": 25415 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", - "cost": { - "input": 1, - "output": 1 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Perplexity: Sonar Pro", - "display_name": "Perplexity: Sonar Pro", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -47468,65 +50279,92 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 400000, + 
"output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Perplexity: Sonar Reasoning Pro", - "display_name": "Perplexity: Sonar Reasoning Pro", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 2, - "output": 8 + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "perplexity/sonar-pro-search", - "name": "Perplexity: Sonar Pro Search", - "display_name": "Perplexity: Sonar Pro Search", + "id": "o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -47534,155 
+50372,163 @@ }, "limit": { "context": 200000, - "output": 8000 + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-10-31", - "last_updated": "2026-03-15", + "knowledge": "2024-05", + "release_date": "2024-06-26", + "last_updated": "2024-06-26", "cost": { - "input": 3, - "output": 15 + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "perplexity/sonar-deep-research", - "name": "Perplexity: Sonar Deep Research", - "display_name": "Perplexity: Sonar Deep Research", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 25600 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" - }, - { - "id": "anthracite-org/magnum-v4-72b", - "name": "Magnum v4 72B", - "display_name": "Magnum v4 72B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 2048 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + 
], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-22", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 3, - "output": 5 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "mancer/weaver", - "name": "Mancer: Weaver (alpha)", - "display_name": "Mancer: Weaver (alpha)", + "id": "gpt-image-1", + "name": "gpt-image-1", + "display_name": "gpt-image-1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2023-08-02", - "last_updated": "2026-03-15", - "cost": { - "input": 0.75, - "output": 1 - }, - "type": "chat" + "release_date": "2025-04-24", + "last_updated": "2025-04-24", + "type": "imageGeneration" }, { - "id": "baidu/ernie-4.5-vl-424b-a47b", - "name": "Baidu: ERNIE 4.5 VL 424B A47B ", - "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 123000, - "output": 16000 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + 
"last_updated": "2025-04-14", "cost": { - "input": 0.42, - "output": 1.25 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-vl-28b-a3b", - "name": "Baidu: ERNIE 4.5 VL 28B A3B", - "display_name": "Baidu: ERNIE 4.5 VL 28B A3B", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -47693,72 +50539,70 @@ ] }, "limit": { - "context": 30000, - "output": 8000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.14, - "output": 0.56 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "baidu/ernie-4.5-21b-a3b-thinking", - "name": "Baidu: ERNIE 4.5 21B A3B Thinking", - "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "id": "gpt-image-1-mini", + "name": "gpt-image-1-mini", + "display_name": "gpt-image-1-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", - "cost": { - "input": 0.07, - "output": 0.28 + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", + "type": "imageGeneration" }, { - "id": "baidu/cobuddy:free", - "name": "Baidu: CoBuddy (free)", - "display_name": "Baidu: CoBuddy (free)", + "id": "gpt-5-nano", + "name": 
"GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -47766,164 +50610,126 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2026-05-06", - "last_updated": "2026-05-07", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "baidu/ernie-4.5-21b-a3b", - "name": "Baidu: ERNIE 4.5 21B A3B", - "display_name": "Baidu: ERNIE 4.5 21B A3B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 120000, - "output": 8000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2025-06-30", - "cost": { - "input": 0.07, - "output": 0.28 - }, - "type": "chat" - }, - { - "id": "baidu/qianfan-ocr-fast", - "name": "Baidu: Qianfan-OCR-Fast", - "display_name": "Baidu: Qianfan-OCR-Fast", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 65536, - "output": 28672 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-20", - "last_updated": "2026-05-16", - "cost": { - "input": 0.68, - "output": 2.81 - }, - "type": "chat" - }, - { - "id": "baidu/ernie-4.5-300b-a47b", - "name": "Baidu: ERNIE 4.5 300B A47B ", - "display_name": 
"Baidu: ERNIE 4.5 300B A47B ", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 123000, - "output": 12000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-30", - "last_updated": "2026-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "x-ai/grok-4.20-multi-agent", - "name": "xAI: Grok 4.20 Multi-Agent", - "display_name": "xAI: Grok 4.20 Multi-Agent", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1050000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "x-ai/grok-build-0.1", - "name": "xAI: Grok Build 0.1", - 
"display_name": "xAI: Grok Build 0.1", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -47936,69 +50742,82 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-05-20", - "last_updated": "2026-05-27", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.2 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "x-ai/grok-4.20", - "name": "xAI: Grok 4.20", - "display_name": "xAI: Grok 4.20", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-31", - "last_updated": "2026-04-11", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "x-ai/grok-4.3", - "name": "xAI: Grok 4.3", - "display_name": "xAI: Grok 4.3", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, 
"limit": { - "context": 1000000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -48006,100 +50825,109 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-01", - "last_updated": "2026-05-01", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "stealth/claude-sonnet-4.6", - "name": "Stealth: Claude Sonnet 4.6 (20% off)", - "display_name": "Stealth: Claude Sonnet 4.6 (20% off)", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", "high", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - 
"Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-17", - "last_updated": "2026-05-27", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2.4, - "output": 12, - "cache_read": 0.24, - "cache_write": 3 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "stealth/claude-opus-4.7", - "name": "Stealth: Claude Opus 4.7 (20% off)", - "display_name": "Stealth: Claude Opus 4.7 (20% off)", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -48113,139 +50941,153 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "xhigh", - "max" + "high" ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-05-27", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 4, - "output": 20, - "cache_read": 0.4, - "cache_write": 5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "stealth/claude-opus-4.6", - "name": "Stealth: Claude Opus 4.6 (20% off)", - "display_name": "Stealth: Claude Opus 4.6 (20% off)", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", "high", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-05-27", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 4, - "output": 20, - "cache_read": 0.4, - "cache_write": 5 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "NVIDIA: Nemotron 3 Nano 30B A3B", - "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "id": "gpt-image-2", + "name": "gpt-image-2", + "display_name": "gpt-image-2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 52429 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.05, - "output": 0.2 + "input": 5, + "output": 30, + "cache_read": 1.25 }, - "type": "chat" - }, + "type": "imageGeneration" + } + ] + }, + "berget": { + "id": "berget", + "name": "Berget.AI", + "display_name": "Berget.AI", + "api": "https://api.berget.ai/v1", + "doc": "https://api.berget.ai", + "models": [ { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "NVIDIA: Nemotron Nano 9B V2", - "display_name": "NVIDIA: Nemotron Nano 9B V2", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": 
[ "text" @@ -48255,8 +51097,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -48266,22 +51108,22 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2023-12", + "release_date": "2025-04-27", + "last_updated": "2025-04-27", "cost": { - "input": 0.04, - "output": 0.16 + "input": 0.99, + "output": 0.99 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", - "name": "NVIDIA: Nemotron 3 Nano Omni (free)", - "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "audio", "image", "video" ], @@ -48290,8 +51132,8 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -48299,31 +51141,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0, - "output": 0 + "input": 0.83, + "output": 3.85, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b:free", - "name": "NVIDIA: Nemotron 3 Super (free)", - "display_name": "NVIDIA: Nemotron 3 Super (free)", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ - "text" + "audio", + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 
128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -48331,20 +51189,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-12", - "last_updated": "2026-03-15", + "knowledge": "2025-12", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0, - "output": 0 + "input": 0.275, + "output": 0.55 }, "type": "chat" }, { - "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", - "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", - "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ "text" @@ -48354,8 +51213,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -48363,22 +51222,29 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.44, + "output": 0.99 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA: Nemotron 3 Super", - "display_name": "NVIDIA: Nemotron 3 Super", + "id": "mistralai/Mistral-Medium-3.5-128B", + "name": "Mistral Medium 3.5 128B", + "display_name": "Mistral Medium 3.5 128B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -48387,7 +51253,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -48395,21 +51261,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": 
"2026-04-11", + "knowledge": "2026-04", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.1 + "input": 1.65, + "output": 5.5 }, "type": "chat" }, { - "id": "switchpoint/router", - "name": "Switchpoint Router", - "display_name": "Switchpoint Router", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct 2506", + "display_name": "Mistral Small 3.2 24B Instruct 2506", "modalities": { "input": [ "text" @@ -48419,29 +51285,30 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-12", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.85, - "output": 3.4 + "input": 0.33, + "output": 0.33 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Arcee AI: Trinity Mini", - "display_name": "Arcee AI: Trinity Mini", + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -48451,8 +51318,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -48460,55 +51327,73 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-12", - "last_updated": "2026-01-28", + "knowledge": "2025-12", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0.77, + "output": 2.75 }, 
"type": "chat" - }, + } + ] + }, + "snowflake-cortex": { + "id": "snowflake-cortex", + "name": "Snowflake Cortex", + "display_name": "Snowflake Cortex", + "api": "https://${SNOWFLAKE_ACCOUNT}.snowflakecomputing.com/api/v2/cortex/v1", + "doc": "https://docs.snowflake.com/en/user-guide/snowflake-cortex/cortex-rest-api", + "models": [ { - "id": "arcee-ai/trinity-large-thinking", - "name": "Arcee AI: Trinity Large Thinking", - "display_name": "Arcee AI: Trinity Large Thinking", + "id": "openai-gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-11", - "cost": { - "input": 0.22, - "output": 0.85 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "type": "chat" }, { - "id": "arcee-ai/spotlight", - "name": "Arcee AI: Spotlight", - "display_name": "Arcee AI: Spotlight", + "id": "snowflake-llama3.3-70b", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -48516,121 +51401,164 @@ ] }, "limit": { - "context": 131072, - "output": 65537 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", - "cost": { - "input": 0.18, - "output": 0.18 - }, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "type": "chat" }, { - "id": "arcee-ai/maestro-reasoning", - "name": "Arcee 
AI: Maestro Reasoning", - "display_name": "Arcee AI: Maestro Reasoning", + "id": "openai-gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", - "cost": { - "input": 0.9, - "output": 3.3 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "type": "chat" }, { - "id": "arcee-ai/coder-large", - "name": "Arcee AI: Coder Large", - "display_name": "Arcee AI: Coder Large", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", - "cost": { - "input": 0.5, - "output": 0.8 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model 
family." + ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "type": "chat" }, { - "id": "arcee-ai/virtuoso-large", - "name": "Arcee AI: Virtuoso Large", - "display_name": "Arcee AI: Virtuoso Large", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", - "cost": { - "input": 0.75, - "output": 1.2 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "type": "chat" }, { - "id": "gryphe/mythomax-l2-13b", - "name": "MythoMax 13B", - "display_name": "MythoMax 13B", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -48640,192 +51568,297 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-04-25", - "last_updated": "2024-04-25", - "cost": { - "input": 0.06, - "output": 0.06 - }, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "type": "chat" }, { - "id": "microsoft/phi-4", - "name": "Microsoft: Phi 4", - "display_name": "Microsoft: Phi 4", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", - "cost": { - "input": 0.06, - "output": 0.14 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + 
"max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "type": "chat" }, { - "id": "microsoft/wizardlm-2-8x22b", - "name": "WizardLM-2 8x22B", - "display_name": "WizardLM-2 8x22B", + "id": "openai-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65535, - "output": 8000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-24", - "last_updated": "2024-04-24", - "cost": { - "input": 0.62, - "output": 0.62 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Microsoft: Phi 4 Mini Instruct", - "display_name": "Microsoft: Phi 4 Mini Instruct", + "id": "openai-gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ + "text", + "image", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1050000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": 
"2026-04-23", + "last_updated": "2026-04-23", + "type": "chat" + }, + { + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 1000000, "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-17", - "last_updated": "2026-05-07", - "cost": { - "input": 0.08, - "output": 0.35, - "cache_read": 0.08 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "type": "chat" }, { - "id": "writer/palmyra-x5", - "name": "Writer: Palmyra X5", - "display_name": "Writer: Palmyra X5", + "id": "openai-gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1040000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", - "cost": { - "input": 0.6, - "output": 6 - }, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-mini", - "name": "ByteDance Seed: Seed-2.0-Mini", - "display_name": "ByteDance Seed: Seed-2.0-Mini", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "image", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-27", - "last_updated": "2026-03-15", - "cost": { - "input": 0.1, - "output": 0.4 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + 
"Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "bytedance-seed/seed-1.6-flash", - "name": "ByteDance Seed: Seed 1.6 Flash", - "display_name": "ByteDance Seed: Seed 1.6 Flash", + "id": "mistral-large2", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", "modalities": { "input": [ - "image", "text", - "video" + "image" ], "output": [ "text" @@ -48833,138 +51866,159 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2026-03-15", - "cost": { - "input": 0.075, - "output": 0.3 - }, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "type": "chat" }, { - "id": "bytedance-seed/seed-1.6", - "name": "ByteDance Seed: Seed 1.6", - "display_name": "ByteDance Seed: Seed 1.6", + "id": "openai-gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "image", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09", - "last_updated": "2025-09", - "cost": { - "input": 0.25, - "output": 2 - }, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "type": "chat" }, { - "id": "bytedance-seed/seed-2.0-lite", - "name": "ByteDance Seed: 
Seed-2.0-Lite", - "display_name": "ByteDance Seed: Seed-2.0-Lite", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "image", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-10", - "last_updated": "2026-03-15", - "cost": { - "input": 0.25, - "output": 2 + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "type": "chat" }, { - "id": "nex-agi/deepseek-v3.1-nex-n1", - "name": "Nex AGI: DeepSeek V3.1 Nex N1", - "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", + "id": "openai-gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 163840 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", - "cost": { - "input": 0.27, - "output": 1 - }, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "type": "chat" }, { - "id": "tencent/hy3-preview", - "name": "Tencent: Hy3 Preview", - "display_name": "Tencent: Hy3 Preview", + "id": "gemini-3.1-pro", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -48974,56 +52028,71 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-05-16", - "cost": { - "input": 0.066, - "output": 0.26, - "cache_read": 0.029 - }, + 
"knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "type": "chat" }, { - "id": "tencent/hunyuan-a13b-instruct", - "name": "Tencent: Hunyuan A13B Instruct", - "display_name": "Tencent: Hunyuan A13B Instruct", + "id": "openai-gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 272000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "type": "chat" - }, + } + ] + }, + "github-models": { + "id": "github-models", + "name": "GitHub Models", + "display_name": "GitHub Models", + "api": "https://models.github.ai/inference", + "doc": "https://docs.github.com/en/github-models", + "models": [ { - "id": "ibm-granite/granite-4.1-8b", - "name": "IBM: Granite 4.1 8B", - "display_name": "IBM: Granite 4.1 8B", + "id": "ai21-labs/ai21-jamba-1.5-mini", + "name": "AI21 Jamba 1.5 Mini", + "display_name": "AI21 Jamba 1.5 Mini", "modalities": { "input": [ "text" @@ -49033,29 +52102,30 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-05-01", + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - 
"id": "ibm-granite/granite-4.0-h-micro", - "name": "IBM: Granite 4.0 Micro", - "display_name": "IBM: Granite 4.0 Micro", + "id": "ai21-labs/ai21-jamba-1.5-large", + "name": "AI21 Jamba 1.5 Large", + "display_name": "AI21 Jamba 1.5 Large", "modalities": { "input": [ "text" @@ -49065,28 +52135,30 @@ ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 256000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-08-29", + "last_updated": "2024-08-29", "cost": { - "input": 0.017, - "output": 0.11 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "StepFun: Step 3.5 Flash", - "display_name": "StepFun: Step 3.5 Flash", + "id": "core42/jais-30b-chat", + "name": "JAIS 30b Chat", + "display_name": "JAIS 30b Chat", "modalities": { "input": [ "text" @@ -49096,8 +52168,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -49107,19 +52179,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "knowledge": "2023-03", + "release_date": "2023-08-30", + "last_updated": "2023-08-30", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "aion-labs/aion-2.0", - "name": "AionLabs: Aion-2.0", - "display_name": "AionLabs: Aion-2.0", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ "text" @@ -49129,29 +52201,30 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + 
"tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-15", + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 0.8, - "output": 1.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "aion-labs/aion-1.0", - "name": "AionLabs: Aion-1.0", - "display_name": "AionLabs: Aion-1.0", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ "text" @@ -49161,29 +52234,30 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "knowledge": "2024-10", + "release_date": "2024-12-09", + "last_updated": "2024-12-09", "cost": { - "input": 4, - "output": 8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "aion-labs/aion-rp-llama-3.1-8b", - "name": "AionLabs: Aion-RP 1.0 (8B)", - "display_name": "AionLabs: Aion-RP 1.0 (8B)", + "id": "microsoft/phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE instruct (128k)", + "display_name": "Phi-3.5-MoE instruct (128k)", "modalities": { "input": [ "text" @@ -49193,28 +52267,30 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.8, - "output": 1.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": 
"aion-labs/aion-1.0-mini", - "name": "AionLabs: Aion-1.0-Mini", - "display_name": "AionLabs: Aion-1.0-Mini", + "id": "microsoft/phi-3-small-128k-instruct", + "name": "Phi-3-small instruct (128k)", + "display_name": "Phi-3-small instruct (128k)", "modalities": { "input": [ "text" @@ -49224,64 +52300,65 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.7, - "output": 1.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-pro-v1", - "name": "Amazon: Nova Pro 1.0", - "display_name": "Amazon: Nova Pro 1.0", + "id": "microsoft/phi-3.5-mini-instruct", + "name": "Phi-3.5-mini instruct (128k)", + "display_name": "Phi-3.5-mini instruct (128k)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-lite-v1", - "name": "Amazon: Nova Lite 1.0", - "display_name": "Amazon: Nova Lite 1.0", + "id": "microsoft/phi-3-medium-128k-instruct", + "name": "Phi-3-medium instruct (128k)", + "display_name": "Phi-3-medium instruct (128k)", "modalities": { "input": [ - "image", 
"text" ], "output": [ @@ -49289,28 +52366,30 @@ ] }, "limit": { - "context": 300000, - "output": 5120 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.06, - "output": 0.24 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-micro-v1", - "name": "Amazon: Nova Micro 1.0", - "display_name": "Amazon: Nova Micro 1.0", + "id": "microsoft/phi-3-small-8k-instruct", + "name": "Phi-3-small instruct (8k)", + "display_name": "Phi-3-small instruct (8k)", "modalities": { "input": [ "text" @@ -49320,31 +52399,32 @@ ] }, "limit": { - "context": 128000, - "output": 5120 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-06", - "last_updated": "2026-03-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.035, - "output": 0.14 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-premier-v1", - "name": "Amazon: Nova Premier 1.0", - "display_name": "Amazon: Nova Premier 1.0", + "id": "microsoft/phi-4-reasoning", + "name": "Phi-4-Reasoning", + "display_name": "Phi-4-Reasoning", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -49352,42 +52432,41 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": 
false, - "release_date": "2025-11-01", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2.5, - "output": 12.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "amazon/nova-2-lite-v1", - "name": "Amazon: Nova 2 Lite", - "display_name": "Amazon: Nova 2 Lite", - "modalities": { + "id": "microsoft/mai-ds-r1", + "name": "MAI-DS-R1", + "display_name": "MAI-DS-R1", + "modalities": { "input": [ - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65535 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -49395,20 +52474,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "inclusionai/ling-2.6-flash", - "name": "inclusionAI: Ling-2.6 Flash", - "display_name": "inclusionAI: Ling-2.6 Flash", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -49418,29 +52498,30 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.016 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": 
"inclusionai/ling-2.6-1t", - "name": "inclusionAI: Ling-2.6-1T", - "display_name": "inclusionAI: Ling-2.6-1T", + "id": "microsoft/phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -49450,40 +52531,42 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-05-16", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "inclusionai/ring-2.6-1t", - "name": "inclusionAI: Ring-2.6-1T", - "display_name": "inclusionAI: Ring-2.6-1T", + "id": "microsoft/phi-3.5-vision-instruct", + "name": "Phi-3.5-vision instruct (128k)", + "display_name": "Phi-3.5-vision instruct (128k)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -49492,20 +52575,20 @@ "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-08", - "last_updated": "2026-05-16", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.075, - "output": 0.625, - "cache_read": 0.015 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph: Morph V3 Fast", - "display_name": "Morph: Morph V3 Fast", + "id": "microsoft/phi-3-medium-4k-instruct", + "name": "Phi-3-medium instruct (4k)", + "display_name": "Phi-3-medium instruct (4k)", "modalities": { "input": [ "text" @@ -49515,59 +52598,65 @@ ] }, "limit": { - "context": 81920, - 
"output": 38000 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.8, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph: Morph V3 Large", - "display_name": "Morph: Morph V3 Large", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi-4-multimodal-instruct", + "display_name": "Phi-4-multimodal-instruct", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.9, - "output": 1.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "undi95/remm-slerp-l2-13b", - "name": "ReMM SLERP 13B", - "display_name": "ReMM SLERP 13B", + "id": "microsoft/phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -49577,156 +52666,86 @@ ] }, "limit": { - "context": 6144, + "context": 128000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-07-22", - "last_updated": 
"2026-03-15", - "cost": { - "input": 0.45, - "output": 0.65 - }, - "type": "chat" - }, - { - "id": "google/gemini-2.0-flash-lite-001", - "name": "Google: Gemini 2.0 Flash Lite", - "display_name": "Google: Gemini 2.0 Flash Lite", - "modalities": { - "input": [ - "audio", - "image", - "pdf", - "text", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1048576, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, + "knowledge": "2023-10", "release_date": "2024-12-11", - "last_updated": "2026-03-15", + "last_updated": "2024-12-11", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "id": "microsoft/phi-3-mini-128k-instruct", + "name": "Phi-3-mini instruct (128k)", + "display_name": "Phi-3-mini instruct (128k)", "modalities": { "input": [ - "image", - "text" - ], - "output": [ - "image", "text" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-08", - "last_updated": "2026-03-15", - "cost": { - "input": 0.3, - "output": 2.5 - }, - "type": "imageGeneration" - }, - { - "id": "google/gemini-2.0-flash-001", - "name": "Google: Gemini 2.0 Flash", - "display_name": "Google: Gemini 2.0 Flash", - "modalities": { - "input": [ - "audio", - "image", - "pdf", - "text", - "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": 
"2024-12-11", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025, - "cache_write": 0.083333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/lyria-3-clip-preview", - "name": "Google: Lyria 3 Clip Preview", - "display_name": "Google: Lyria 3 Clip Preview", + "id": "microsoft/phi-3-mini-4k-instruct", + "name": "Phi-3-mini instruct (4k)", + "display_name": "Phi-3-mini instruct (4k)", "modalities": { "input": [ - "image", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { "input": 0, "output": 0 @@ -49734,26 +52753,24 @@ "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview", - "name": "Google: Gemini 2.5 Pro Preview 06-05", - "display_name": "Google: Gemini 2.5 Pro Preview 06-05", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -49762,132 +52779,127 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": 
"tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Google: Gemini 3.1 Flash Lite Preview", - "display_name": "Google: Gemini 3.1 Flash Lite Preview", + "id": "openai/o1-mini", + "name": "OpenAI o1-mini", + "display_name": "OpenAI o1-mini", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 0.25, - "output": 1.5, - "reasoning": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Google: Gemma 4 31B", - "display_name": "Google: Gemma 4 31B", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "image", "text", - 
"video" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-11", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.14, - "output": 0.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Google: Gemini 3 Flash Preview", - "display_name": "Google: Gemini 3 Flash Preview", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -49896,56 +52908,45 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.5, - "output": 3, - "reasoning": 3, - "cache_read": 0.05, - "cache_write": 0.083333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Google: Gemini 3.1 Pro 
Preview Custom Tools", - "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -49954,52 +52955,45 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro-preview-05-06", - "name": "Google: Gemini 2.5 Pro Preview 05-06", - "display_name": "Google: Gemini 2.5 Pro Preview 05-06", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -50008,87 +53002,79 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, 
- "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-05-06", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Google: Gemma 3n 4B", - "display_name": "Google: Gemma 3n 4B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 6554 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Google: Gemini 2.5 Pro", - "display_name": "Google: Gemini 2.5 Pro", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -50097,96 
+53083,68 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-03-20", - "last_updated": "2026-03-15", + "knowledge": "2023-10", + "release_date": "2024-09-12", + "last_updated": "2024-12-17", "cost": { - "input": 1.25, - "output": 10, - "reasoning": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Google: Gemini 3.1 Pro Preview", - "display_name": "Google: Gemini 3.1 Pro Preview", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "display_name": 
"Google: Gemma 3 27B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" @@ -50194,7 +53152,7 @@ }, "limit": { "context": 128000, - "output": 65536 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -50202,137 +53160,99 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2026-03-15", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.03, - "output": 0.11, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Google: Gemini 3.1 Flash Lite", - "display_name": "Google: Gemini 3.1 Flash Lite", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-07", - "last_updated": "2026-05-16", + "knowledge": "2023-10", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.25, - "output": 1.5, - "reasoning": 1.5, - "cache_read": 0.025, - "cache_write": 0.08333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Google: Gemini 2.5 Flash Lite", - "display_name": "Google: Gemini 2.5 Flash Lite", + "id": "mistral-ai/mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ - "audio", 
- "image", - "pdf", "text", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-17", - "last_updated": "2026-03-15", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.1, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Google: Gemini 2.5 Flash", - "display_name": "Google: Gemini 2.5 Flash", + "id": "mistral-ai/mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -50340,89 +53260,66 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-07-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + 
"knowledge": "2024-03", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.3, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.03, - "cache_write": 0.083333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-12b-it", - "name": "Google: Gemma 3 12B", - "display_name": "Google: Gemma 3 12B", + "id": "mistral-ai/mistral-medium-2505", + "name": "Mistral Medium 3 (25.05)", + "display_name": "Mistral Medium 3 (25.05)", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-05-01", + "last_updated": "2025-05-01", "cost": { - "input": 0.04, - "output": 0.13, - "cache_read": 0.015 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Google: Gemma 4 26B A4B", - "display_name": "Google: Gemma 4 26B A4B", + "id": "mistral-ai/mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -50430,81 +53327,56 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.12, - "output": 0.4 + 
"input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite-preview-09-2025", - "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", - "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "id": "mistral-ai/ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.1, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-4b-it", - "name": "Google: Gemma 3 4B", - "display_name": "Google: Gemma 3 4B", + "id": "mistral-ai/codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -50512,43 +53384,41 @@ ] }, "limit": { - "context": 131072, - "output": 19200 + "context": 32000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-13", - "last_updated": 
"2026-03-15", + "attachment": false, + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.04, - "output": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Google: Gemini 3.5 Flash", - "display_name": "Google: Gemini 3.5 Flash", + "id": "cohere/cohere-command-a", + "name": "Cohere Command A", + "display_name": "Cohere Command A", "modalities": { "input": [ - "audio", - "image", - "pdf", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -50556,65 +53426,43 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-19", - "last_updated": "2026-05-27", + "knowledge": "2024-03", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 1.5, - "output": 9, - "reasoning": 9, - "cache_read": 0.15, - "cache_write": 0.08333 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/lyria-3-pro-preview", - "name": "Google: Lyria 3 Pro Preview", - "display_name": "Google: Lyria 3 Pro Preview", + "id": "cohere/cohere-command-r-08-2024", + "name": "Cohere Command R 08-2024", + "display_name": "Cohere Command R 08-2024", "modalities": { "input": [ - "image", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - 
"attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-04-11", + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { "input": 0, "output": 0 @@ -50622,9 +53470,9 @@ "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "Google: Gemma 2 27B", - "display_name": "Google: Gemma 2 27B", + "id": "cohere/cohere-command-r-plus", + "name": "Cohere Command R+", + "display_name": "Cohere Command R+", "modalities": { "input": [ "text" @@ -50634,123 +53482,96 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-06-24", - "last_updated": "2024-06-24", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-04-04", + "last_updated": "2024-08-01", "cost": { - "input": 0.65, - "output": 0.65 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemini-3-pro-image-preview", - "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", - "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "id": "cohere/cohere-command-r-plus-08-2024", + "name": "Cohere Command R+ 08-2024", + "display_name": "Cohere Command R+ 08-2024", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, 
- "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2026-03-15", + "knowledge": "2024-03", + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 2, - "output": 12, - "reasoning": 12 + "input": 0, + "output": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", - "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "id": "cohere/cohere-command-r", + "name": "Cohere Command R", + "display_name": "Cohere Command R", "modalities": { "input": [ - "image", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-03-15", + "knowledge": "2024-03", + "release_date": "2024-03-11", + "last_updated": "2024-08-01", "cost": { - "input": 0.5, - "output": 3 + "input": 0, + "output": 0 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "OpenAI: GPT-4o (2024-08-06)", - "display_name": "OpenAI: GPT-4o (2024-08-06)", + "id": "meta/meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -50758,82 +53579,67 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-06", 
- "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 15, - "output": 120 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "OpenAI: GPT-5 Mini", - "display_name": "OpenAI: GPT-5 Mini", + "id": "meta/meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -50841,103 +53647,66 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { 
- "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "OpenAI: o3 Mini High", - "display_name": "OpenAI: o3 Mini High", + "id": "meta/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", "release_date": "2025-01-31", - "last_updated": "2026-03-15", + "last_updated": "2025-01-31", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/o4-mini-high", - "name": "OpenAI: o4 Mini High", - "display_name": "OpenAI: o4 Mini High", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", 
"modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -50945,46 +53714,32 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-17", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1.1, - "output": 4.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "OpenAI: GPT-5 Chat", - "display_name": "OpenAI: GPT-5 Chat", + "id": "meta/meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -50993,32 +53748,31 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "OpenAI: GPT-4o", - "display_name": "OpenAI: GPT-4o", + "id": "meta/meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": 
"Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51027,90 +53781,68 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI: GPT-5.2", - "display_name": "OpenAI: GPT-5.2", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-2024-07-18", - "name": "OpenAI: 
GPT-4o-mini (2024-07-18)", - "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", + "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -51118,86 +53850,64 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "meta/meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", 
"cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI: o3", - "display_name": "OpenAI: o3", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51205,10 +53915,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 65536, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -51217,46 +53927,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "OpenAI: GPT-5 Image", - "display_name": "OpenAI: GPT-5 Image", + "id": "deepseek/deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -51264,24 +53968,23 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-14", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + 
"release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 10, - "output": 10 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "OpenAI: GPT-4o (2024-11-20)", - "display_name": "OpenAI: GPT-4o (2024-11-20)", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51289,45 +53992,11 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2024-11-20", - "last_updated": "2026-03-15", - "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5", - "name": "OpenAI: GPT-5", - "display_name": "OpenAI: GPT-5", - "modalities": { - "input": [ - "image", - "pdf", - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, "reasoning": { "supported": true, "default": true @@ -51335,96 +54004,72 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" - 
}, + } + ] + }, + "neuralwatt": { + "id": "neuralwatt", + "name": "Neuralwatt", + "display_name": "Neuralwatt", + "api": "https://api.neuralwatt.com/v1", + "doc": "https://portal.neuralwatt.com/docs", + "models": [ { - "id": "openai/gpt-5.4-pro", - "name": "OpenAI: GPT-5.4 Pro", - "display_name": "OpenAI: GPT-5.4 Pro", + "id": "kimi-k2.5-fast", + "name": "Kimi K2.5 Fast", + "display_name": "Kimi K2.5 Fast", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262128, + "output": 262128 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 30, - "output": 180 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "OpenAI: GPT-4.1 Mini", - "display_name": "OpenAI: GPT-4.1 Mini", + "id": "glm-5-fast", + "name": "GLM 5 Fast", + "display_name": "GLM 5 Fast", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51432,33 +54077,30 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 202736, + "output": 202736 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": 
"2026-04-07", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "OpenAI: GPT-5.2 Pro", - "display_name": "OpenAI: GPT-5.2 Pro", + "id": "qwen3.5-397b-fast", + "name": "Qwen3.5 397B Fast", + "display_name": "Qwen3.5 397B Fast", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51466,53 +54108,41 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262128, + "output": 262128 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 21, - "output": 168 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "OpenAI: o3 Pro", - "display_name": "OpenAI: o3 Pro", + "id": "glm-5.1-fast", + "name": "GLM 5.1 Fast", + "display_name": "GLM 5.1 Fast", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51520,250 +54150,205 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202736, + "output": 202736 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - 
"mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 20, - "output": 80 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "OpenAI: GPT-4o-mini Search Preview", - "display_name": "OpenAI: GPT-4o-mini Search Preview", + "id": "kimi-k2.6-fast", + "name": "Kimi K2.6 Fast", + "display_name": "Kimi K2.6 Fast", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262128, + "output": 262128 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-01", - "last_updated": "2025-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI: o4 Mini", - "display_name": "OpenAI: o4 Mini", + "id": "qwen3.6-35b-fast", + "name": "Qwen3.6 35B Fast", + "display_name": "Qwen3.6 35B Fast", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131056, + "output": 131056 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": 
[ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.29, + "output": 1.15 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "OpenAI: GPT-5.4", - "display_name": "OpenAI: GPT-5.4", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262128, + "output": 262128 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2.5, - "output": 15 + "input": 0.69, + "output": 3.22 }, "type": "chat" }, { - "id": "openai/gpt-5.4-image-2", - "name": "OpenAI: GPT-5.4 Image 2", - "display_name": "OpenAI: GPT-5.4 Image 2", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "image", "text", - "pdf" + "image" ], 
"output": [ - "image", "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 262128, + "output": 262128 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-05-01", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 8, - "output": 15, - "cache_read": 2 + "input": 0.52, + "output": 2.59 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI: o3 Mini", - "display_name": "OpenAI: o3 Mini", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131056, + "output": 131056 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -51772,47 +54357,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2024-12-20", - "last_updated": "2026-03-15", + "open_weights": 
true, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.29, + "output": 1.15 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "OpenAI: GPT-5.5", - "display_name": "OpenAI: GPT-5.5", + "id": "Qwen/Qwen3.5-397B-A17B-FP8", + "name": "Qwen3.5 397B A17B FP8", + "display_name": "Qwen3.5 397B A17B FP8", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262128, + "output": 262128 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -51821,39 +54400,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-01", + "last_updated": "2026-02-01", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.69, + "output": 4.14 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-16k", - "name": "OpenAI: GPT-3.5 Turbo 16k", - "display_name": "OpenAI: GPT-3.5 Turbo 16k", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -51863,88 +54431,68 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 16368, + "output": 16368 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2023-08-28", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 3, - "output": 4 + "input": 0.03, + "output": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "OpenAI: GPT-5.1", - "display_name": "OpenAI: GPT-5.1", + "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262128, + "output": 262128 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.12, + "output": 0.35 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "OpenAI: GPT-5 Nano", - "display_name": "OpenAI: GPT-5 Nano", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM 5.1 FP8", + "display_name": "GLM 5.1 FP8", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -51952,10 +54500,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202736, + "output": 202736 }, - "temperature": false, + "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, @@ -51964,39 +54512,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 1.1, + "output": 3.6 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI: gpt-oss-120b", - "display_name": "OpenAI: gpt-oss-120b", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -52006,8 +54543,8 @@ ] }, "limit": { - "context": 131072, - "output": 26215 + "context": 196592, + "output": 196592 }, "temperature": true, "tool_call": true, @@ -52017,27 +54554,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.039, - "output": 0.19 + "input": 0.35, + "output": 1.38 }, "type": "chat" - }, + } + ] + }, + "siliconflow": { + "id": "siliconflow", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.cn/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "openai/gpt-4o-mini", - 
"name": "OpenAI: GPT-4o-mini", - "display_name": "OpenAI: GPT-4o-mini", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52045,87 +54595,61 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-07-18", - "last_updated": "2026-03-15", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "OpenAI: GPT-5.1-Codex-Max", - "display_name": "OpenAI: GPT-5.1-Codex-Max", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - 
"name": "OpenAI: GPT-5.1-Codex-Mini", - "display_name": "OpenAI: GPT-5.1-Codex-Mini", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -52133,55 +54657,30 @@ ] }, "limit": { - "context": 400000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "openai/o1-pro", - "name": "OpenAI: o1-pro", - "display_name": "OpenAI: o1-pro", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52189,47 +54688,61 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": false, + 
"release_date": "2025-04-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 0.57 }, - "attachment": true, + "type": "chat" + }, + { + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2026-03-15", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 150, - "output": 600 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-chat-latest", - "name": "OpenAI: GPT Chat Latest", - "display_name": "OpenAI: GPT Chat Latest", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52237,10 +54750,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -52248,24 +54761,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-05", - "last_updated": "2026-05-07", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-4-1106-preview", - "name": "OpenAI: GPT-4 Turbo (older v1106)", - "display_name": "OpenAI: GPT-4 Turbo 
(older v1106)", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ "text" @@ -52275,8 +54793,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -52285,18 +54803,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2026-03-15", + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 30 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "OpenAI: gpt-oss-20b", - "display_name": "OpenAI: gpt-oss-20b", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -52307,13 +54825,12 @@ }, "limit": { "context": 131072, - "output": 26215 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -52321,19 +54838,19 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "openai/gpt-4-0314", - "name": "OpenAI: GPT-4 (older v0314)", - "display_name": "OpenAI: GPT-4 (older v0314)", + "id": "stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", "modalities": { "input": [ "text" @@ -52343,28 +54860,29 @@ ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, 
+ "default": true }, "attachment": false, "open_weights": false, - "release_date": "2023-05-28", - "last_updated": "2026-03-15", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 30, - "output": 60 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo-preview", - "name": "OpenAI: GPT-4 Turbo Preview", - "display_name": "OpenAI: GPT-4 Turbo Preview", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ "text" @@ -52374,8 +54892,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -52384,22 +54902,20 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2026-03-15", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 10, - "output": 30 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "OpenAI: o3 Deep Research", - "display_name": "OpenAI: o3 Deep Research", + "id": "inclusionAI/Ling-mini-2.0", + "name": "inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52407,91 +54923,76 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "release_date": "2025-09-10", + "last_updated": 
"2025-11-25", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "openai/gpt-audio", - "name": "OpenAI: GPT Audio", - "display_name": "OpenAI: GPT Audio", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ - "audio", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "openai/gpt-5-image-mini", - "name": "OpenAI: GPT-5 Image Mini", - "display_name": "OpenAI: GPT-5 Image Mini", + "id": "Pro/moonshotai/Kimi-K2-Thinking", + "name": "Pro/moonshotai/Kimi-K2-Thinking", + "display_name": "Pro/moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ - "image", "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -52499,24 +55000,33 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2026-03-15", + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 2 + "input": 
0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "OpenAI: GPT-4.1", - "display_name": "OpenAI: GPT-4.1", + "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52524,122 +55034,119 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "OpenAI: GPT-5.4 Nano", - "display_name": "OpenAI: GPT-5.4 Nano", + "id": "Pro/moonshotai/Kimi-K2.6", + "name": "Pro/moonshotai/Kimi-K2.6", + "display_name": "Pro/moonshotai/Kimi-K2.6", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "attachment": 
false, + "open_weights": true, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-audio-mini", - "name": "OpenAI: GPT Audio Mini", - "display_name": "OpenAI: GPT Audio Mini", + "id": "Pro/moonshotai/Kimi-K2.5", + "name": "Pro/moonshotai/Kimi-K2.5", + "display_name": "Pro/moonshotai/Kimi-K2.5", "modalities": { "input": [ - "audio", - "text" + "text", + "image" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-20", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.6, - "output": 2.4 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "OpenAI: GPT-5.3-Codex", - "display_name": "OpenAI: GPT-5.3-Codex", + "id": "Pro/zai-org/GLM-5", + "name": "Pro/zai-org/GLM-5", + "display_name": "Pro/zai-org/GLM-5", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -52647,9 +55154,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 205000, + "output": 205000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -52658,53 +55166,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": 
"medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-25", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.75, - "output": 14 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "OpenAI: GPT-5.5 Pro", - "display_name": "OpenAI: GPT-5.5 Pro", + "id": "Pro/zai-org/GLM-4.7", + "name": "Pro/zai-org/GLM-4.7", + "display_name": "Pro/zai-org/GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 205000, + "output": 205000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -52712,60 +55208,75 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 30, - "output": 180 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "openai/gpt-4o-audio-preview", - "name": "OpenAI: GPT-4o Audio", - "display_name": "OpenAI: GPT-4o Audio", + "id": "Pro/zai-org/GLM-5.1", + "name": "Pro/zai-org/GLM-5.1", + "display_name": "Pro/zai-org/GLM-5.1", "modalities": { "input": [ - "audio", "text" ], "output": [ - "audio", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { 
- "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2026-03-15", + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 2.5, - "output": 10 + "input": 1.4, + "output": 4.4, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "OpenAI: o4 Mini Deep Research", - "display_name": "OpenAI: o4 Mini Deep Research", + "id": "Pro/deepseek-ai/DeepSeek-R1", + "name": "Pro/deepseek-ai/DeepSeek-R1", + "display_name": "Pro/deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52773,8 +55284,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -52785,32 +55296,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-06-26", - "last_updated": "2026-03-15", + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "OpenAI: GPT-3.5 Turbo", - "display_name": "OpenAI: GPT-3.5 Turbo", + "id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", 
"modalities": { "input": [ "text" @@ -52820,32 +55327,31 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "OpenAI: GPT-5.2 Chat", - "display_name": "OpenAI: GPT-5.2 Chat", + "id": "Pro/deepseek-ai/DeepSeek-V3.2", + "name": "Pro/deepseek-ai/DeepSeek-V3.2", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -52853,29 +55359,34 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 164000, + "output": 164000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "OpenAI: GPT-3.5 Turbo Instruct", - "display_name": "OpenAI: GPT-3.5 Turbo Instruct", + "id": "Pro/deepseek-ai/DeepSeek-V3", + "name": "Pro/deepseek-ai/DeepSeek-V3", + "display_name": "Pro/deepseek-ai/DeepSeek-V3", "modalities": { "input": [ "text" @@ -52885,215 +55396,210 @@ ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, 
"reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2023-03-01", - "last_updated": "2023-09-21", + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 1.5, - "output": 2 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "OpenAI: GPT-5.2-Codex", - "display_name": "OpenAI: GPT-5.2-Codex", + "id": "Pro/MiniMaxAI/MiniMax-M2.1", + "name": "Pro/MiniMaxAI/MiniMax-M2.1", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 197000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "OpenAI: GPT-5.1-Codex", - "display_name": "OpenAI: GPT-5.1-Codex", + "id": "Pro/MiniMaxAI/MiniMax-M2.5", + "name": "Pro/MiniMaxAI/MiniMax-M2.5", + "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 192000, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": 
{ - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 1.22 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "OpenAI: GPT-4o (2024-05-13)", - "display_name": "OpenAI: GPT-4o (2024-05-13)", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen/Qwen3.6-35B-A3B", + "display_name": "Qwen/Qwen3.6-35B-A3B", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 5, - "output": 15 + "input": 0.23, + "output": 1.86 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "OpenAI: GPT-5.1 Chat", - "display_name": "OpenAI: GPT-5.1 Chat", + "id": 
"Qwen/Qwen3.5-397B-A17B", + "name": "Qwen/Qwen3.5-397B-A17B", + "display_name": "Qwen/Qwen3.5-397B-A17B", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.29, + "output": 1.74 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "OpenAI: gpt-oss-safeguard-20b", - "display_name": "OpenAI: gpt-oss-safeguard-20b", + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen/Qwen3.5-122B-A10B", + "display_name": "Qwen/Qwen3.5-122B-A10B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 65536 }, "temperature": true, @@ -53102,156 +55608,185 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 0.29, + 
"output": 2.32 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-0613", - "name": "OpenAI: GPT-3.5 Turbo (older v0613)", - "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "id": "Qwen/Qwen3.5-27B", + "name": "Qwen/Qwen3.5-27B", + "display_name": "Qwen/Qwen3.5-27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 4095, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", "cost": { - "input": 1, - "output": 2 + "input": 0.26, + "output": 2.09 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "OpenAI: GPT-5.4 Mini", - "display_name": "OpenAI: GPT-5.4 Mini", + "id": "Qwen/Qwen3.5-4B", + "name": "Qwen/Qwen3.5-4B", + "display_name": "Qwen/Qwen3.5-4B", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-04-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "OpenAI: GPT-4 Turbo", - "display_name": "OpenAI: GPT-4 Turbo", + "id": "Qwen/Qwen3.5-9B", + "name": "Qwen/Qwen3.5-9B", + "display_name": "Qwen/Qwen3.5-9B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 10, - "output": 30 + "input": 0.22, + "output": 1.74 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen/Qwen3.5-35B-A3B", + "display_name": "Qwen/Qwen3.5-35B-A3B", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -53260,67 +55795,75 @@ "extra_capabilities": { "reasoning": 
{ "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-05", - "last_updated": "2026-03-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-25", + "last_updated": "2026-02-25", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.23, + "output": 1.86 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "OpenAI: GPT-4", - "display_name": "OpenAI: GPT-4", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2023-03-14", - "last_updated": "2024-04-09", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 30, - "output": 60 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "OpenAI: GPT-5.3 Chat", - "display_name": "OpenAI: GPT-5.3 Chat", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -53328,27 +55871,28 @@ ] }, "limit": { - 
"context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-15", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "openai/gpt-4o-search-preview", - "name": "OpenAI: GPT-4o Search Preview", - "display_name": "OpenAI: GPT-4o Search Preview", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -53358,31 +55902,30 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-03-13", - "last_updated": "2026-03-15", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 2.5, - "output": 10 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "OpenAI: GPT-4.1 Nano", - "display_name": "OpenAI: GPT-4.1 Nano", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ - "image", - "pdf", "text" ], "output": [ @@ -53390,29 +55933,28 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2026-03-15", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.4, - 
"cache_read": 0.025 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "poolside/laguna-m.1:free", - "name": "Poolside: Laguna M.1 (free)", - "display_name": "Poolside: Laguna M.1 (free)", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ "text" @@ -53428,23 +55970,33 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "poolside/laguna-xs.2:free", - "name": "Poolside: Laguna XS.2 (free)", - "display_name": "Poolside: Laguna XS.2 (free)", + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" @@ -53460,55 +56012,54 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-05-01", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "bytedance/ui-tars-1.5-7b", - "name": "ByteDance: UI-TARS 7B ", - "display_name": "ByteDance: UI-TARS 7B ", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", "modalities": { "input": [ - "image", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 
2048 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2026-03-15", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.2 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "minimax/minimax-m1", - "name": "MiniMax: MiniMax M1", - "display_name": "MiniMax: MiniMax M1", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ "text" @@ -53518,61 +56069,70 @@ ] }, "limit": { - "context": 1000000, - "output": 40000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 2.2 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "minimax/minimax-01", - "name": "MiniMax: MiniMax-01", - "display_name": "MiniMax: MiniMax-01", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000192, - "output": 1000192 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-01-15", - "last_updated": 
"2025-01-15", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 1.1 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax: MiniMax M2.1", - "display_name": "MiniMax: MiniMax M2.1", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ "text" @@ -53582,35 +56142,39 @@ ] }, "limit": { - "context": 196608, - "output": 39322 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax: MiniMax M2.7", - "display_name": "MiniMax: MiniMax M2.7", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -53620,41 +56184,27 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": 
"2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 - }, - "type": "chat" + "input": 0.18, + "output": 0.18 + } }, { - "id": "minimax/minimax-m2", - "name": "MiniMax: MiniMax M2", - "display_name": "MiniMax: MiniMax M2", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ "text" @@ -53664,8 +56214,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -53675,24 +56225,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.255, - "output": 1, - "cache_read": 0.03 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax: MiniMax M2.5", - "display_name": "MiniMax: MiniMax M2.5", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ "text" @@ -53702,8 +56257,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -53713,24 +56268,29 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": 
"2026-02-12", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 1.2, - "cache_read": 0.029 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "minimax/minimax-m2-her", - "name": "MiniMax: MiniMax M2-her", - "display_name": "MiniMax: MiniMax M2-her", + "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ "text" @@ -53740,28 +56300,28 @@ ] }, "limit": { - "context": 65536, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-23", - "last_updated": "2026-03-15", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "allenai/olmo-3-32b-think", - "name": "AllenAI: Olmo 3 32B Think", - "display_name": "AllenAI: Olmo 3 32B Think", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ "text" @@ -53771,101 +56331,71 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-11-22", - "last_updated": "2026-03-15", + "open_weights": false, + "release_date": "2025-03-06", + "last_updated": 
"2025-11-25", "cost": { "input": 0.15, - "output": 0.5 + "output": 0.58 }, "type": "chat" - } - ] - }, - "regolo-ai": { - "id": "regolo-ai", - "name": "Regolo AI", - "display_name": "Regolo AI", - "api": "https://api.regolo.ai/v1", - "doc": "https://docs.regolo.ai/", - "models": [ + }, { - "id": "mistral-small3.2", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 120000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 2.2 + "input": 0.18, + "output": 0.68 }, "type": "chat" }, { - "id": "qwen3-reranker-4b", - "name": "Qwen3-Reranker-4B", - "display_name": "Qwen3-Reranker-4B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32768, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.12, - "output": 0.12 - }, - "type": "rerank" - }, - { - "id": "qwen3.5-122b", - "name": "Qwen3.5-122B", - "display_name": "Qwen3.5-122B", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ "text", @@ -53876,8 +56406,8 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, 
"tool_call": true, @@ -53897,31 +56427,30 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.9, - "output": 3.6 + "input": 0.18, + "output": 2 }, "type": "chat" }, { - "id": "mistral-small-4-119b", - "name": "Mistral Small 4 119B", - "display_name": "Mistral Small 4 119B", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -53929,20 +56458,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.75, - "output": 3 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ "text" @@ -53952,34 +56492,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": 
"2025-08-05", + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 4.2 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -53989,29 +56523,27 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" + "input": 0.07, + "output": 0.28 + } }, { - "id": "gpt-oss-20b", - "name": "GPT-OSS-20B", - "display_name": "GPT-OSS-20B", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -54021,45 +56553,68 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", + "cost": { + "input": 0.25, + "output": 1 + } + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 
8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 1.8 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5-9B", - "display_name": "Qwen3.5-9B", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 8192 }, "temperature": true, @@ -54079,20 +56634,20 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, + "input": 0.13, "output": 0.6 }, "type": "chat" }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -54102,59 +56657,59 @@ ] }, "limit": { - "context": 32768, + "context": 131072, "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 1.4 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen-image", - "name": 
"Qwen-Image", - "display_name": "Qwen-Image", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 2 + "input": 0.18, + "output": 0.18 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax 2.5", - "display_name": "MiniMax 2.5", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text" @@ -54164,34 +56719,28 @@ ] }, "limit": { - "context": 190000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-10", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.8, - "output": 3.5 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -54201,8 +56750,8 @@ ] }, "limit": { - "context": 120000, - "output": 120000 + "context": 131072, + "output": 8192 }, "temperature": 
true, "tool_call": true, @@ -54211,18 +56760,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { "input": 0.05, - "output": 0.25 + "output": 0.05 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ "text" @@ -54232,127 +56781,113 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.7 + "input": 0.09, + "output": 0.3 }, "type": "chat" - } - ] - }, - "google-vertex": { - "id": "google-vertex", - "name": "Vertex", - "display_name": "Vertex", - "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", - "models": [ + }, { - "id": "gemini-2.5-flash-tts", - "name": "Gemini 2.5 Flash TTS", - "display_name": "Gemini 2.5 Flash TTS", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, 
"reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-30", - "last_updated": "2025-12-10", + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 10 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -54360,510 +56895,299 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": 
true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "output": 0.4 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "PaddlePaddle/PaddleOCR-VL-1.5", + "name": "PaddlePaddle/PaddleOCR-VL-1.5", + "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "PaddlePaddle/PaddleOCR-VL", + "name": "PaddlePaddle/PaddleOCR-VL", + "display_name": "PaddlePaddle/PaddleOCR-VL", "modalities": { "input": [ "text", - 
"image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "release_date": "2025-10-16", + "last_updated": "2025-10-16", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - 
"cache_write": 0.383 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", 
"modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": 
"2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.383 + "input": 0.5, + "output": 1.9 }, "type": "chat" }, { - "id": "gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "deepseek-ai/DeepSeek-V4-Pro", + "display_name": "deepseek-ai/DeepSeek-V4-Pro", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1049000, + "output": 393000 }, "temperature": true, "tool_call": true, @@ -54874,168 +57198,122 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "deepseek-ai/DeepSeek-OCR", + "name": "deepseek-ai/DeepSeek-OCR", + "display_name": "deepseek-ai/DeepSeek-OCR", "modalities": { "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2048, - "output": 1 + "context": 8192, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-05", - 
"release_date": "2025-05-20", - "last_updated": "2025-05-20", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-20", + "last_updated": "2025-10-20", "cost": { - "input": 0.15, + "input": 0, "output": 0 - }, - "type": "embedding" + } }, { - "id": "gemini-2.5-pro-tts", - "name": "Gemini 2.5 Pro TTS", - "display_name": "Gemini 2.5 Pro TTS", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-30", - "last_updated": "2025-12-10", + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 20 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "zai-org/glm-4.7-maas", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": 
true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "zai-org/glm-5-maas", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -55045,8 +57323,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -55056,30 +57334,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text" @@ -55089,29 +57360,28 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-13", - 
"last_updated": "2025-08-13", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking-maas", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", "modalities": { "input": [ "text" @@ -55121,8 +57391,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -55130,44 +57400,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": false, + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.2-maas", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -55176,32 +57433,30 @@ "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-17", - "last_updated": "2026-04-04", + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", 
"cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.056 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v3.1-maas", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -55209,31 +57464,41 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.6, - "output": 1.7 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct-maas", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", + "id": "ascend-tribe/pangu-pro-moe", + "name": "ascend-tribe/pangu-pro-moe", + "display_name": "ascend-tribe/pangu-pro-moe", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 524288, + "context": 131072, "output": 8192 }, "temperature": true, @@ -55241,21 +57506,20 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", - "cost": { - "input": 0.35, - "output": 1.15 + "attachment": false, + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2026-01-16", + "cost": { + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": 
"meta/llama-3.3-70b-instruct-maas", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "Kwaipilot/KAT-Dev", + "name": "Kwaipilot/KAT-Dev", + "display_name": "Kwaipilot/KAT-Dev", "modalities": { "input": [ "text" @@ -55266,7 +57530,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -55274,20 +57538,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2025-09-27", + "last_updated": "2026-01-16", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-maas", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -55298,28 +57561,18 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.09, - "output": 0.36 + "supported": false }, "type": "chat" }, { - "id": "openai/gpt-oss-20b-maas", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -55330,37 +57583,18 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": 
"2025-08-05", - "cost": { - "input": 0.07, - "output": 0.25 + "supported": false }, "type": "chat" - } - ] - }, - "deepseek": { - "id": "deepseek", - "name": "DeepSeek", - "display_name": "DeepSeek", - "api": "https://api.deepseek.com", - "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", - "models": [ + }, { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "inclusionAI/Ring-1T", + "name": "inclusionAI/Ring-1T", + "display_name": "inclusionAI/Ring-1T", "modalities": { "input": [ "text" @@ -55370,10 +57604,9 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -55381,41 +57614,15 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Compatibility alias for deepseek-v4-flash thinking mode." 
- ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-01-20", - "last_updated": "2026-04-24", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 - }, "type": "chat" }, { - "id": "deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "inclusionAI/Ling-1T", + "name": "inclusionAI/Ling-1T", + "display_name": "inclusionAI/Ling-1T", "modalities": { "input": [ "text" @@ -55425,85 +57632,107 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2024-12-26", - "last_updated": "2026-04-24", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 - }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "Qwen/Qwen-Image-Edit-2509", + "name": "Qwen/Qwen-Image-Edit-2509", + "display_name": "Qwen/Qwen-Image-Edit-2509", "modalities": { "input": [ + "image", "text" ], "output": [ - "text" + "image" ] }, - "limit": { - "context": 1048576, - "output": 393216 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image-Edit", + "name": "Qwen/Qwen-Image-Edit", + "display_name": "Qwen/Qwen-Image-Edit", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "image" + ] }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + } + }, + { + "id": "Qwen/Qwen-Image", + "name": "Qwen/Qwen-Image", + "display_name": "Qwen/Qwen-Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": 
"high", - "effort_options": [ - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." - ] - } + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-I2V-A14B", + "name": "Wan-AI/Wan2.2-I2V-A14B", + "display_name": "Wan-AI/Wan2.2-I2V-A14B", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "video" + ] }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Wan-AI/Wan2.2-T2V-A14B", + "name": "Wan-AI/Wan2.2-T2V-A14B", + "display_name": "Wan-AI/Wan2.2-T2V-A14B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "video" + ] }, - "type": "chat" + "tool_call": false, + "reasoning": { + "supported": false + } }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ "text" @@ -55513,61 +57742,19 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
- ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "supported": false }, "type": "chat" - } - ] - }, - "orcarouter": { - "id": "orcarouter", - "name": "OrcaRouter", - "display_name": "OrcaRouter", - "api": "https://api.orcarouter.ai/v1", - "doc": "https://docs.orcarouter.ai", - "models": [ + }, { - "id": "z-ai/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "stepfun-ai/step3", + "name": "stepfun-ai/step3", + "display_name": "stepfun-ai/step3", "modalities": { "input": [ "text" @@ -55577,37 +57764,36 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "TeleAI/TeleSpeechASR", + "name": "TeleAI/TeleSpeechASR", + "display_name": "TeleAI/TeleSpeechASR", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "THUDM/GLM-4.1V-9B-Thinking", + "name": "THUDM/GLM-4.1V-9B-Thinking", + "display_name": "THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text" @@ -55617,43 +57803,20 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", "modalities": { "input": [ "text" @@ -55663,42 +57826,42 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "type": "chat" + }, + { + "id": "moonshotai/Kimi-Dev-72B", + "name": "moonshotai/Kimi-Dev-72B", + "display_name": "moonshotai/Kimi-Dev-72B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMaxAI/MiniMax-M1-80k", + "display_name": "MiniMaxAI/MiniMax-M1-80k", "modalities": { "input": [ "text" @@ -55709,31 +57872,18 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": 
true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "supported": false }, "type": "chat" }, { - "id": "z-ai/glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", "modalities": { "input": [ "text" @@ -55744,31 +57894,19 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", - "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 - }, "type": "chat" }, { - "id": "z-ai/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "modalities": { "input": [ "text" @@ -55778,42 +57916,20 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 - }, "type": "chat" }, { - "id": "deepseek/deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": 
"Qwen/Qwen3-30B-A3B", + "name": "Qwen/Qwen3-30B-A3B", + "display_name": "Qwen/Qwen3-30B-A3B", "modalities": { "input": [ "text" @@ -55823,14 +57939,12 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -55843,612 +57957,1638 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2026-02-28", - "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.028 - }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "Qwen/Qwen3-Reranker-8B", + "name": "Qwen/Qwen3-Reranker-8B", + "display_name": "Qwen/Qwen3-Reranker-8B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2026-02-28", - "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 - }, - "type": "chat" + "type": "rerank" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen/Qwen3-Embedding-8B", + "display_name": "Qwen/Qwen3-Embedding-8B", "modalities": { "input": [ "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0.19, - "output": 0.37, - "cache_read": 0.0028 + "supported": false }, - "type": "chat" + "type": "embedding" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "Qwen/Qwen3-Reranker-4B", + "name": "Qwen/Qwen3-Reranker-4B", + "display_name": "Qwen/Qwen3-Reranker-4B", "modalities": { "input": [ "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0.56, - "output": 1.12, - "cache_read": 0.003625 + "supported": false }, - "type": "chat" + "type": "rerank" }, { - "id": "orcarouter/auto", - "name": "OrcaRouter Auto", - "display_name": "OrcaRouter Auto", + "id": "Qwen/Qwen3-Embedding-4B", + "name": "Qwen/Qwen3-Embedding-4B", + "display_name": "Qwen/Qwen3-Embedding-4B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2026-05-14", - "cost": { - "input": 
0, - "output": 0 - }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen/Qwen3-Reranker-0.6B", + "display_name": "Qwen/Qwen3-Reranker-0.6B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "score" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, - "type": "chat" + "type": "rerank" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen/Qwen3-Embedding-0.6B", + "display_name": "Qwen/Qwen3-Embedding-0.6B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "embedding" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "supported": false }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "supported": false }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "Qwen/QVQ-72B-Preview", + "name": "Qwen/QVQ-72B-Preview", + "display_name": "Qwen/QVQ-72B-Preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "default": true }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "type": "chat" + }, + { + "id": "fnlp/MOSS-TTSD-v0.5", + "name": "fnlp/MOSS-TTSD-v0.5", + "display_name": "fnlp/MOSS-TTSD-v0.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "FunAudioLLM/CosyVoice2-0.5B", + "name": "FunAudioLLM/CosyVoice2-0.5B", + "display_name": "FunAudioLLM/CosyVoice2-0.5B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "FunAudioLLM/SenseVoiceSmall", + "name": "FunAudioLLM/SenseVoiceSmall", + "display_name": "FunAudioLLM/SenseVoiceSmall", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "IndexTeam/IndexTTS-2", + "name": "IndexTeam/IndexTTS-2", + "display_name": "IndexTeam/IndexTTS-2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "BAAI/bge-m3", + "name": "BAAI/bge-m3", + "display_name": "BAAI/bge-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "BAAI/bge-reranker-v2-m3", + "name": "BAAI/bge-reranker-v2-m3", + "display_name": "BAAI/bge-reranker-v2-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "netease-youdao/bce-embedding-base_v1", + "name": "netease-youdao/bce-embedding-base_v1", + "display_name": "netease-youdao/bce-embedding-base_v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "embedding" + ] + }, + 
"limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "netease-youdao/bce-reranker-base_v1", + "name": "netease-youdao/bce-reranker-base_v1", + "display_name": "netease-youdao/bce-reranker-base_v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Kwai-Kolors/Kolors", + "name": "Kwai-Kolors/Kolors", + "display_name": "Kwai-Kolors/Kolors", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Qwen/Qwen2-VL-72B-Instruct", + "name": "Qwen/Qwen2-VL-72B-Instruct", + "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + } + }, + { + "id": "internlm/internlm2_5-7b-chat", + "name": "internlm/internlm2_5-7b-chat", + "display_name": "internlm/internlm2_5-7b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + 
"limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "THUDM/glm-4-9b-chat", + "name": "THUDM/glm-4-9b-chat", + "display_name": "THUDM/glm-4-9b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "BAAI/bge-large-en-v1.5", + "name": "BAAI/bge-large-en-v1.5", + "display_name": "BAAI/bge-large-en-v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "BAAI/bge-large-zh-v1.5", + "name": "BAAI/bge-large-zh-v1.5", + "display_name": "BAAI/bge-large-zh-v1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + 
"display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + } + }, + { + "id": "Pro/BAAI/bge-m3", + "name": "Pro/BAAI/bge-m3", + "display_name": "Pro/BAAI/bge-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "embedding" + }, + { + "id": "Pro/Qwen/Qwen2.5-7B-Instruct", + "name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/BAAI/bge-reranker-v2-m3", + "name": "Pro/BAAI/bge-reranker-v2-m3", + "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "score" + ] + }, + "limit": { + "context": 8192, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "type": "rerank" + }, + { + "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + 
"supported": false + }, + "type": "chat" + }, + { + "id": "Pro/Qwen/Qwen2-7B-Instruct", + "name": "Pro/Qwen/Qwen2-7B-Instruct", + "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "Pro/THUDM/glm-4-9b-chat", + "name": "Pro/THUDM/glm-4-9b-chat", + "display_name": "Pro/THUDM/glm-4-9b-chat", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + }, + { + "id": "THUDM/GLM-Z1-Rumination-32B-0414", + "name": "THUDM/GLM-Z1-Rumination-32B-0414", + "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "type": "chat" + }, + { + "id": "stabilityai/stable-diffusion-xl-base-1.0", + "name": "stabilityai/stable-diffusion-xl-base-1.0", + "display_name": "stabilityai/stable-diffusion-xl-base-1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-schnell", + "name": "black-forest-labs/FLUX.1-schnell", + "display_name": "black-forest-labs/FLUX.1-schnell", + "modalities": { + "input": [ + "text" + ], + 
"output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-dev", + "name": "black-forest-labs/FLUX.1-dev", + "display_name": "black-forest-labs/FLUX.1-dev", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "Pro/black-forest-labs/FLUX.1-schnell", + "name": "Pro/black-forest-labs/FLUX.1-schnell", + "display_name": "Pro/black-forest-labs/FLUX.1-schnell", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "stabilityai/stable-diffusion-3-5-large", + "name": "stabilityai/stable-diffusion-3-5-large", + "display_name": "stabilityai/stable-diffusion-3-5-large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "fishaudio/fish-speech-1.4", + "name": "fishaudio/fish-speech-1.4", + "display_name": "fishaudio/fish-speech-1.4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "RVC-Boss/GPT-SoVITS", + "name": "RVC-Boss/GPT-SoVITS", + "display_name": "RVC-Boss/GPT-SoVITS", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "fishaudio/fish-speech-1.5", + "name": "fishaudio/fish-speech-1.5", + "display_name": "fishaudio/fish-speech-1.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "black-forest-labs/FLUX.1-pro", + "name": "black-forest-labs/FLUX.1-pro", + "display_name": "black-forest-labs/FLUX.1-pro", + "modalities": { + "input": [ + "text" + ], + "output": 
[ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "LoRA/black-forest-labs/FLUX.1-dev", + "name": "LoRA/black-forest-labs/FLUX.1-dev", + "display_name": "LoRA/black-forest-labs/FLUX.1-dev", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "tool_call": false, + "reasoning": { + "supported": false + } + }, + { + "id": "SeedLLM/Seed-Rice-7B", + "name": "SeedLLM/Seed-Rice-7B", + "display_name": "SeedLLM/Seed-Rice-7B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "type": "chat" + } + ] + }, + "merge-gateway": { + "id": "merge-gateway", + "name": "Merge Gateway", + "display_name": "Merge Gateway", + "doc": "https://docs.merge.dev/merge-gateway", + "models": [ + { + "id": "xai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 30000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", + "cost": { + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "xai/grok-4.20-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 30000 
+ }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-09", + "cost": { + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "mistral/codestral-latest", + "name": "Codestral (latest)", + "display_name": "Codestral (latest)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2024-05-29", + "last_updated": "2025-01-04", + "cost": { + "input": 0.3, + "output": 0.9 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "mistral/devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + 
"open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "cost": { + "input": 0.1, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "mistral/pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "cost": { + "input": 2, + "output": 6 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-medium-latest", + "name": "Mistral Medium (latest)", + "display_name": "Mistral Medium (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-small-latest", + "name": "Mistral Small (latest)", + "display_name": "Mistral Small (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 256000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 
3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-large-2411", + "name": "Mistral Large 2.1", + "display_name": "Mistral Large 2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", + "cost": { + "input": 2, + "output": 6 + }, + "type": "chat" + }, + { + "id": "mistral/magistral-medium-latest", + "name": "Magistral Medium (latest)", + "display_name": "Magistral Medium (latest)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-03-17", + "last_updated": "2025-03-20", + "cost": { + "input": 2, + "output": 5 + }, + "type": "chat" + }, + { + "id": "mistral/devstral-medium-latest", + "name": "Devstral 2 (latest)", + "display_name": "Devstral 2 (latest)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": 
"2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "mistral/devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "mistral/mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "mistral/devstral-medium-2507", + "name": "Devstral Medium", + "display_name": "Devstral Medium", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, 
+ "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -56456,57 +59596,72 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -56514,66 +59669,66 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "google/gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ "text", "image", "video", - "audio" + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -56585,40 +59740,82 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0.115, - "output": 0.917 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" }, { - "id": "qwen/qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + 
}, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "type": "chat" + }, + { + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -56630,85 +59827,162 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.115, - "output": 0.688, - "reasoning": 2.4 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "google/gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + 
"release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.359, - "output": 1.434 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "qwen/qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, @@ -56720,248 +59994,689 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", 
"continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, "release_date": "2026-04-02", "last_updated": "2026-04-02", + "type": "chat" + }, + { + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, + "input": 2, + "output": 12, + "cache_read": 0.2, 
"tiers": [ { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, + "input": 4, + "output": 18, + "cache_read": 0.4, "tier": { "type": "context", - "size": 256000 + "size": 200000 } } ], "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, + "type": "chat" + }, + { + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 + }, + "type": "chat" + }, + { + "id": "google/gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "input_audio": 1 + }, + "type": "chat" + }, + { + "id": 
"google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 + }, + "type": "chat" + }, + { + "id": "openai/o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + 
"minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + 
"temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", + "cost": { + "input": 5, + "output": 15 + }, "type": "chat" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5 35B-A3B", - "display_name": "Qwen3.5 35B-A3B", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.057, - "output": 0.459 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "qwen/qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "openai/gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 
}, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.248, - "output": 1.485 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "openai/gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.172, - "output": 1.032 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ "text", - "image", - "video", - "audio" + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.086, - "output": 0.688 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "grok/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -56969,84 +60684,91 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 1.1, + 
"output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", @@ -57057,46 +60779,45 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2024-09-30", + 
"release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.13, - "output": 0.38 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "google/gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "openai/gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -57104,155 +60825,92 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - 
"knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2023-09", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 4, - "output": 18, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "google/gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", "image", - 
"audio", - "video", "pdf" ], "output": [ @@ -57260,38 +60918,49 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.075, - "input_audio": 1 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -57299,143 +60968,130 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, 
"open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { "input": 2.5, "output": 15, - "cache_read": 0.125, + "cache_read": 0.25, "tiers": [ { - "input": 2.5, - "output": 15, - "cache_read": 0.25, + "input": 5, + "output": 22.5, + "cache_read": 0.5, "tier": { "type": "context", - "size": 200000 + "size": 272000 } } ], "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 5, + "output": 22.5, + "cache_read": 0.5 } }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 4, - "output": 18, - "cache_read": 0.2, - "tiers": [ - { - "input": 
4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -57443,68 +61099,44 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -57514,89 +61146,88 
@@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1047576, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.06, - "output": 0.33 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", - "image", - "video", - "audio", - 
"pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -57606,55 +61237,44 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", "low", + "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 4, - "output": 18, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -57672,19 +61292,19 @@ "attachment": true, "open_weights": false, "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 
Pro", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -57696,20 +61316,26 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -57722,29 +61348,31 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 15, - "output": 120 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -57760,10 +61388,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -57776,161 +61404,165 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": 
"context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "zai/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "zai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": 
true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "zai/glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "zai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -57939,122 +61571,118 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ 
- "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "zai/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "zai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + 
"context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "zai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58063,54 +61691,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "zai/glm-5-turbo", + "name": 
"GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58119,52 +61736,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 60, - "output": 270, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "anthropic/claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -58176,84 +61771,111 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "anthropic/claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 21, - "output": 168 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -58265,7 +61887,7 @@ ] }, "limit": { - "context": 1050000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -58279,55 +61901,44 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, - "output": 22.5, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "anthropic/claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -58339,117 +61950,132 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { "input": 5, - "output": 30, + "output": 25, "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "anthropic/claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "anthropic/claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58459,95 +62085,105 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "anthropic/claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", @@ -58559,44 +62195,68 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58606,202 +62266,233 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "cohere/command-a-03-2025", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 2.5, + "output": 10 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "type": "chat" + }, + { + "id": "cohere/command-r-08-2024", + "name": "Command R", + "display_name": "Command R", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": 
"2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "cohere/command-r7b-12-2024", + "name": "Command R7B", + "display_name": "Command R7B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "cohere/command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "cost": { + "input": 2.5, + "output": 10 + }, + "type": "chat" + }, + { + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 384000 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": 
true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58810,55 +62501,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, 
+ "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58866,38 +62545,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "minimax/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -58907,45 +62579,49 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "minimax/minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -58953,287 +62629,341 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "minimax/minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
400000, + "context": 196608, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "minimax/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 15 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - 
"name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" - }, + } + ] + }, + "qihang-ai": { + "id": "qihang-ai", + "name": "QiHang", + "display_name": "QiHang", + "api": "https://api.qhaigc.net/v1", + "doc": "https://www.qhaigc.net/docs", + "models": [ { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-07-31", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 10, - "output": 30 + "input": 0.14, + "output": 0.71 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.09, + "output": 0.71, + "tiers": [ + { + "input": 0.09, + "output": 0.71, + 
"tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.09, + "output": 0.71 + } }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2025-03", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 30, - "output": 60 + "input": 0.71, + "output": 3.57 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -59244,81 +62974,113 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "kimi/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + 
"default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.43, + "output": 2.14 }, "type": "chat" }, { - "id": "kimi/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", "image", + "audio", "video" ], "output": [ @@ -59326,10 +63088,10 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 65000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -59338,41 +63100,47 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.57, + "output": 3.43 }, "type": "chat" }, { - "id": 
"minimax/minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "gpt-5-mini", + "name": "GPT-5-Mini", + "display_name": "GPT-5-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -59383,41 +63151,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.04, + "output": 0.29 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -59428,43 +63209,65 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", 
"continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.07, + "output": 0.43, + "tiers": [ + { + "input": 0.07, + "output": 0.43, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.07, + "output": 0.43 + } }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -59472,88 +63275,92 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.14, + "output": 1.14 }, "type": "chat" - }, + } + ] + }, + "xiaomi-token-plan-ams": { + "id": "xiaomi-token-plan-ams", + "name": "Xiaomi Token Plan (Europe)", + "display_name": "Xiaomi Token 
Plan (Europe)", + "api": "https://token-plan-ams.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "mimo-v2.5-tts", + "name": "MiMo-V2.5-TTS", + "display_name": "MiMo-V2.5-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "moonshot": { - "id": "moonshot", - "name": "Moonshot AI (China)", - "display_name": "Moonshot AI (China)", - "api": "https://api.moonshot.cn/v1", - "doc": "https://platform.moonshot.cn/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -59572,20 +63379,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - 
"output": 3, - "cache_read": 0.1 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -59595,66 +63402,79 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "mimo-v2-omni", + 
"name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -59662,33 +63482,46 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", "image", + "audio", "video" ], "output": [ @@ -59696,8 +63529,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -59718,119 +63551,89 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "mimo-v2.5-tts-voicedesign", + "name": "MiMo-V2.5-TTS-VoiceDesign", + "display_name": "MiMo-V2.5-TTS-VoiceDesign", "modalities": { "input": 
[ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "mimo-v2.5-tts-voiceclone", + "name": "MiMo-V2.5-TTS-VoiceClone", + "display_name": "MiMo-V2.5-TTS-VoiceClone", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0, + "output": 0 }, "type": "chat" } ] }, - "minimax-cn-coding-plan": { - "id": "minimax-cn-coding-plan", - "name": "MiniMax Coding Plan (minimaxi.com)", - "display_name": "MiniMax Coding Plan (minimaxi.com)", - 
"api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", - "models": [ - { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "modelscope": { + "id": "modelscope", + "name": "ModelScope", + "display_name": "ModelScope", + "api": "https://api-inference.modelscope.cn/v1", + "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", + "models": [ + { + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -59840,8 +63643,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -59851,38 +63654,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M3", - "name": "MiniMax-M3", - "display_name": "MiniMax-M3", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 128000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -59892,25 +63698,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - 
"attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -59920,36 +63731,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -59959,42 +63763,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - 
"last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -60004,24 +63795,19 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { "input": 0, "output": 0 @@ -60029,9 +63815,9 @@ "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "ZhipuAI/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -60041,8 +63827,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 202752, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -60052,31 +63838,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-07", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { 
- "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "ZhipuAI/GLM-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -60086,8 +63865,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -60095,15 +63874,11 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { "input": 0, "output": 0 @@ -60112,17 +63887,16 @@ } ] }, - "inception": { - "id": "inception", - "name": "Inception", - "display_name": "Inception", - "api": "https://api.inceptionlabs.ai/v1/", - "doc": "https://platform.inceptionlabs.ai/docs", + "groq": { + "id": "groq", + "name": "Groq", + "display_name": "Groq", + "doc": "https://console.groq.com/docs/models", "models": [ { - "id": "mercury-edit-2", - "name": "Mercury Edit 2", - "display_name": "Mercury Edit 2", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -60132,30 +63906,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-30", - "last_updated": "2026-03-30", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": 
"llama-3.1-8b-instant", + "name": "Llama 3.1 8B", + "display_name": "Llama 3.1 8B", "modalities": { "input": [ "text" @@ -60165,128 +63938,83 @@ ] }, "limit": { - "context": 128000, - "output": 50000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025 + "input": 0.05, + "output": 0.08 }, "type": "chat" - } - ] - }, - "kuae-cloud-coding-plan": { - "id": "kuae-cloud-coding-plan", - "name": "KUAE Cloud Coding Plan", - "display_name": "KUAE Cloud Coding Plan", - "api": "https://coding-plan-endpoint.kuaecloud.net/v1", - "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "whisper-large-v3-turbo", + "name": "Whisper Large V3 Turbo", + "display_name": "Whisper Large V3 Turbo", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2024-10-01", + "last_updated": 
"2024-10-01", "type": "chat" - } - ] - }, - "chutes": { - "id": "chutes", - "name": "Chutes", - "display_name": "Chutes", - "api": "https://llm.chutes.ai/v1", - "doc": "https://llm.chutes.ai/v1/models", - "models": [ + }, { - "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", - "name": "MiMo V2 Flash TEE", - "display_name": "MiMo V2 Flash TEE", + "id": "whisper-large-v3", + "name": "Whisper", + "display_name": "Whisper", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", - "cost": { - "input": 0.09, - "output": 0.29, - "cache_read": 0.045 - }, + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-TEE", - "name": "MiniMax M2.5 TEE", - "display_name": "MiniMax M2.5 TEE", + "id": "meta-llama/llama-prompt-guard-2-86m", + "name": "Prompt Guard 2 86M", + "display_name": "Prompt Guard 2 86M", "modalities": { "input": [ "text" @@ -60296,41 +64024,28 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 512, + "output": 512 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.075 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - 
"id": "zai-org/GLM-5.1-TEE", - "name": "GLM 5.1 TEE", - "display_name": "GLM 5.1 TEE", + "id": "meta-llama/llama-prompt-guard-2-22m", + "name": "Llama Prompt Guard 2 22M", + "display_name": "Llama Prompt Guard 2 22M", "modalities": { "input": [ "text" @@ -60340,74 +64055,61 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 512, + "output": 512 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2025-05-29", + "last_updated": "2025-05-29", "cost": { - "input": 1.05, - "output": 3.5, - "cache_read": 0.525 + "input": 0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-FP8", - "name": "GLM 4.7 FP8", - "display_name": "GLM 4.7 FP8", + "id": "meta-llama/llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E", + "display_name": "Llama 4 Scout 17B 16E", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 0.11, + "output": 0.34 }, "type": "chat" }, { - "id": "zai-org/GLM-5-TEE", - "name": "GLM 5 TEE", - "display_name": "GLM 5 TEE", + "id": 
"openai/gpt-oss-safeguard-20b", + "name": "Safety GPT OSS 20B", + "display_name": "Safety GPT OSS 20B", "modalities": { "input": [ "text" @@ -60417,8 +64119,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -60426,32 +64128,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.95, - "output": 2.55, - "cache_read": 0.475 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-TEE", - "name": "GLM 4.7 TEE", - "display_name": "GLM 4.7 TEE", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -60461,8 +64152,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -60472,31 +64163,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-08-05", + "last_updated": "2025-10-21", "cost": { - "input": 0.39, - "output": 1.75, - "cache_read": 0.195 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "zai-org/GLM-5-Turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", 
"modalities": { "input": [ "text" @@ -60506,8 +64190,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -60517,75 +64201,78 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-04-25", + "release_date": "2025-08-05", + "last_updated": "2025-09-25", "cost": { - "input": 0.4891, - "output": 1.9565, - "cache_read": 0.24455 + "input": 0.075, + "output": 0.3, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "GLM 4.6V", - "display_name": "GLM 4.6V", + "id": "canopylabs/orpheus-v1-english", + "name": "Canopy Labs Orpheus V1 English", + "display_name": "Canopy Labs Orpheus V1 English", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 4000, + "output": 50000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2025-12-19", + "last_updated": "2025-12-19", + "type": "chat" + }, + { + "id": "canopylabs/orpheus-arabic-saudi", + "name": "Canopy Labs Orpheus Arabic Saudi", + "display_name": "Canopy Labs Orpheus Arabic Saudi", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", - "cost": { - "input": 0.3, - 
"output": 0.9, - "cache_read": 0.15 + "limit": { + "context": 4000, + "output": 50000 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false }, + "attachment": false, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "type": "chat" }, { - "id": "NousResearch/Hermes-4-14B", - "name": "Hermes 4 14B", - "display_name": "Hermes 4 14B", + "id": "groq/compound", + "name": "Compound", + "display_name": "Compound", "modalities": { "input": [ "text" @@ -60595,41 +64282,24 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", - "cost": { - "input": 0.0136, - "output": 0.0543, - "cache_read": 0.0068 - }, + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-09-04", "type": "chat" }, { - "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", - "name": "DeepHermes 3 Mistral 24B Preview", - "display_name": "DeepHermes 3 Mistral 24B Preview", + "id": "groq/compound-mini", + "name": "Compound Mini", + "display_name": "Compound Mini", "modalities": { "input": [ "text" @@ -60639,42 +64309,35 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", - "cost": { - "input": 0.0245, - "output": 0.0978, - "cache_read": 0.01225 - }, + "open_weights": false, + 
"release_date": "2025-09-04", + "last_updated": "2025-09-04", "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6-TEE", - "name": "Kimi K2.6 TEE", - "display_name": "Kimi K2.6 TEE", + "id": "qwen/qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65535 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, @@ -60693,27 +64356,32 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-06-11", + "last_updated": "2025-06-12", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.475 + "input": 0.29, + "output": 0.59 }, "type": "chat" - }, + } + ] + }, + "mixlayer": { + "id": "mixlayer", + "name": "Mixlayer", + "display_name": "Mixlayer", + "api": "https://models.mixlayer.ai/v1", + "doc": "https://docs.mixlayer.com", + "models": [ { - "id": "moonshotai/Kimi-K2.5-TEE", - "name": "Kimi K2.5 TEE", - "display_name": "Kimi K2.5 TEE", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -60721,7 +64389,7 @@ }, "limit": { "context": 262144, - "output": 65535 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -60740,22 +64408,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.44, - "output": 2, - "cache_read": 0.22 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-TEE", - "name": "DeepSeek V3.1 TEE", - "display_name": "DeepSeek V3.1 TEE", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B 
A3B", + "display_name": "Qwen3.5 35B A3B", "modalities": { "input": [ "text" @@ -60765,8 +64431,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -60787,19 +64453,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.25, + "output": 1.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-TEE", - "name": "DeepSeek V3.2 TEE", - "display_name": "DeepSeek V3.2 TEE", + "id": "qwen/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ "text" @@ -60809,8 +64474,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -60831,19 +64496,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.14 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text" @@ -60853,8 +64517,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -60875,51 +64539,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", - "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 - }, - "type": "chat" - }, - { - "id": 
"deepseek-ai/DeepSeek-V3-0324-TEE", - "name": "DeepSeek V3 0324 TEE", - "display_name": "DeepSeek V3 0324 TEE", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 163840, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.25, - "output": 1, - "cache_read": 0.125 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-TEE", - "name": "DeepSeek R1 0528 TEE", - "display_name": "DeepSeek R1 0528 TEE", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ "text" @@ -60929,8 +64560,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -60951,64 +64582,115 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.225 + "input": 0.4, + "output": 3.2 }, "type": "chat" - }, + } + ] + }, + "orcarouter": { + "id": "orcarouter", + "name": "OrcaRouter", + "display_name": "OrcaRouter", + "api": "https://api.orcarouter.ai/v1", + "doc": "https://docs.orcarouter.ai", + "models": [ { - "id": "rednote-hilab/dots.ocr", - "name": "dots.ocr", - "display_name": "dots.ocr", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, 
"temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 2.5, + "output": 15, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", - "name": "DeepSeek TNG R1T2 Chimera TEE", - "display_name": "DeepSeek TNG R1T2 Chimera TEE", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -61016,85 +64698,43 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", - "cost": { - "input": 0.3, - "output": 1.1, - "cache_read": 0.15 - }, - "type": "chat" - }, - { - "id": "unsloth/Llama-3.2-1B-Instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] 
- }, - "limit": { - "context": 16384, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-04-25", - "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 - }, - "type": "chat" - }, - { - "id": "unsloth/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "unsloth/gemma-3-27b-it", - "name": "gemma 3 27b it", - "display_name": "gemma 3 27b it", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -61105,202 +64745,315 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - 
"last_updated": "2026-04-25", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { - "id": "unsloth/gemma-3-12b-it", - "name": "gemma 3 12b it", - "display_name": "gemma 3 12b it", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.03, - "output": 0.1, - "cache_read": 0.015 + "input": 4, + "output": 18, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "unsloth/gemma-3-4b-it", - "name": "gemma 3 4b it", - "display_name": "gemma 3 4b it", + "id": "google/gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": 
[ "text" ] }, "limit": { - "context": 96000, - "output": 96000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.01, - "output": 0.0272, - "cache_read": 0.005 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "unsloth/Llama-3.2-3B-Instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-02-12", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.01, - "output": 0.0136, - "cache_read": 0.005 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-TEE", - "name": "Qwen3 Coder 
Next TEE", - "display_name": "Qwen3 Coder Next TEE", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-25", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.12, - "output": 0.75, - "cache_read": 0.06 + "input": 4, + "output": 18, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "release_date": 
"2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.2989, - "output": 1.1957, - "cache_read": 0.14945 + "input": 0.06, + "output": 0.33 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "google/gemini-3-pro-preview", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -61311,40 +65064,67 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.06, - "output": 0.22, - "cache_read": 0.03 + "input": 4, + "output": 18, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 
1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -61355,94 +65135,122 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", - "name": "Qwen3 235B A22B Instruct 2507 TEE", - "display_name": "Qwen3 235B A22B Instruct 2507 TEE", + "id": "google/gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.1, - "output": 0.6, - "cache_read": 0.05 + "input": 0.5, + "output": 3, + "cache_read": 0.075, + "input_audio": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": 
"google/gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3Guard-Gen-0.6B", - "name": "Qwen3Guard Gen 0.6B", - "display_name": "Qwen3Guard Gen 0.6B", + "id": "z-ai/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -61452,41 +65260,54 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.01, - "output": 0.0109, - "cache_read": 0.005 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3.5-397B-A17B-TEE", - "name": "Qwen3.5 397B A17B TEE", - "display_name": "Qwen3.5 397B A17B TEE", + "id": "z-ai/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -61494,44 +65315,34 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.39, - "output": 2.34, - "cache_read": 0.195 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-27B-TEE", - "name": "Qwen3.6 27B TEE", - "display_name": "Qwen3.6 27B TEE", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -61550,21 +65361,22 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.195, - "output": 1.56, - "cache_read": 0.0975 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5 Coder 32B Instruct", - "display_name": "Qwen2.5 Coder 32B Instruct", + "id": "z-ai/glm-4.6", + "name": "GLM-4.6", + 
"display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -61574,62 +65386,72 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.0272, - "output": 0.1087, - "cache_read": 0.0136 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "z-ai/glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 98304 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.0543, - "output": 0.2174, - "cache_read": 0.02715 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B-TEE", - "name": "Qwen3 32B TEE", - "display_name": "Qwen3 32B TEE", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -61639,8 +65461,8 @@ ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 204800, + "output": 131072 }, 
"temperature": true, "tool_call": true, @@ -61648,22 +65470,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.08, - "output": 0.24, - "cache_read": 0.04 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "google/gemma-4-31B-turbo-TEE", - "name": "gemma 4 31B turbo TEE", - "display_name": "gemma 4 31B turbo TEE", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", @@ -61674,43 +65507,64 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-TEE", - "name": "gpt oss 120b TEE", - "display_name": "gpt oss 120b TEE", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + 
"text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -61719,38 +65573,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-29", - "last_updated": "2026-04-25", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.045 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" - } - ] - }, - "crof": { - "id": "crof", - "name": "CrofAI", - "display_name": "CrofAI", - "api": "https://crof.ai/v1", - "doc": "https://crof.ai/docs", - "models": [ + }, { - "id": "deepseek-v4-pro-lightning", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -61760,10 +65616,44 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 16385, + "output": 4096 }, "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", + "cost": { + "input": 0.5, + "output": 1.5, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": 
"GPT-5 Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 272000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -61772,62 +65662,68 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.8, - "output": 1.6, - "cache_read": 0.02 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "greg-1", - "name": "Greg 1 Normal", - "display_name": "Greg 1 Normal", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 229376, - "output": 229376 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "greg-rp", - "name": "Greg (Roleplay)", - "display_name": "Greg (Roleplay)", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ 
"text" @@ -61837,29 +65733,29 @@ ] }, "limit": { - "context": 229376, - "output": 229376 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "openai/gpt-4o-2024-05-13", + "name": "GPT-4o (2024-05-13)", + "display_name": "GPT-4o (2024-05-13)", "modalities": { "input": [ "text", @@ -61870,331 +65766,373 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 5, + "output": 15 }, "type": "chat" }, { - "id": "qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - 
"visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { "input": 0.2, - "output": 1.5, - "cache_read": 0.04 + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "openai/gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.18, - "output": 0.35, - "cache_read": 0.04 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "greg-1-super", - "name": "Greg 1 Super", - "display_name": "Greg 1 Super", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 229376, - "output": 229376 + "context": 400000, + "output": 128000 }, - 
"temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + 
"last_updated": "2025-11-13", "cost": { - "input": 0.5, - "output": 1.99, - "cache_read": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "openai/gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + "display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.25, - "output": 1.1, - "cache_read": 0.05, - "cache_write": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "greg-1-mini", - "name": "Greg 1 Mini", - "display_name": "Greg 1 Mini", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 229376, - "output": 229376 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2023-09", + "release_date": "2024-08-06", + "last_updated": "2024-08-06", "cost": { - "input": 0.07, - 
"output": 0.15, - "cache_read": 0.01 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen3.5-9b", - "name": "Qwen3.5 9B", - "display_name": "Qwen3.5 9B", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.04, - "output": 0.15, - "cache_read": 0.008 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -62202,129 +66140,144 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + 
"default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.04, - "output": 0.3, - "cache_read": 0.008, - "cache_write": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.12, - "output": 0.21, - "cache_read": 0.003 + "input": 
0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.48, - "output": 1.9, - "cache_read": 0.1, - "cache_write": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "kimi-k2.5-lightning", - "name": "Kimi K2.5 (Lightning)", - "display_name": "Kimi K2.5 (Lightning)", + "id": "openai/gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -62332,267 +66285,270 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + 
"release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.35, - "output": 1.75, - "cache_read": 0.07 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + 
"release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.11, - "output": 0.95, - "cache_read": 0.02, - "cache_write": 0.375 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.35, - "output": 0.8, - "cache_read": 0.003 + "input": 5, + "output": 22.5, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", - 
"image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.35, - "output": 1.7, - "cache_read": 0.07 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", 
"cost": { - "input": 0.45, - "output": 2.15, - "cache_read": 0.08, - "cache_write": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -62601,66 +66557,53 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 0.8, - "cache_read": 0.003, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" - } - ] - }, - "frogbot": { - "id": "frogbot", - "name": "FrogBot", - "display_name": "FrogBot", - "api": "https://app.frogbot.ai/api/v1", - "doc": "https://docs.frogbot.ai", - "models": [ + }, { - "id": "minimax-m2-7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-4.1-mini", + 
"name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -62669,85 +66612,53 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -62758,30 +66669,52 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-5-4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", @@ -62792,24 +66725,22 @@ ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { 
"reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", - "low", "medium", "high", "xhigh" @@ -62826,19 +66757,32 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 60, + "output": 270, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ "text", @@ -62850,59 +66794,53 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -62910,11 +66848,45 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -62923,114 +66895,164 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "minimal", "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "verbosity": "medium", + 
"verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "zai-glm-5-1", - "name": "Z.AI GLM-5.1", - "display_name": "Z.AI GLM-5.1", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-20", - "last_updated": "2025-02-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimax-m2-5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 8192 + 
"context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-01-15", - "last_updated": "2025-02-22", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-5-5", + "id": "openai/gpt-5.5", "name": "GPT-5.5", "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 272000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -63062,33 +67084,51 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "kimi/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ 
"text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -63096,38 +67136,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "kimi/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -63135,22 +67181,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "orcarouter/auto", + "name": "OrcaRouter 
Auto", + "display_name": "OrcaRouter Auto", "modalities": { "input": [ "text", @@ -63161,8 +67218,8 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -63171,34 +67228,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "release_date": "2025-01-01", + "last_updated": "2026-05-14", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -63208,77 +67264,98 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.07, - "output": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", @@ -63290,36 +67367,57 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-03", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -63327,90 +67425,120 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "kimi-k2-6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "anthropic/claude-opus-4.5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -63418,141 +67546,180 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", + "default_enabled": false, + "mode": "mixed", "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, + "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-07-17", - "last_updated": "2025-07-17", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-5-3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-11", - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "claude-opus-4-6", + "id": "anthropic/claude-opus-4.6", "name": "Claude Opus 4.6", "display_name": "Claude Opus 4.6", "modalities": { @@ -63566,7 +67733,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 128000 }, "temperature": true, @@ -63607,7 +67774,7 @@ "open_weights": false, "knowledge": "2025-05-31", "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "last_updated": "2026-03-13", "cost": { "input": 5, "output": 25, @@ -63617,65 +67784,79 @@ "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek v4 Pro", - "display_name": "DeepSeek v4 Pro", + "id": "grok/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.14 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": 
"context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -63694,96 +67875,76 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "1970-01-01", - "last_updated": "1970-01-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - 
"task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.359, + "output": 1.434 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -63793,36 +67954,45 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-25", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.115, + "output": 0.688, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "qwen/qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ 
-63832,465 +68002,379 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0.086, + "output": 0.688 }, "type": "chat" - } - ] - }, - "anthropic": { - "id": "anthropic", - "name": "Anthropic", - "display_name": "Anthropic", - "doc": "https://docs.anthropic.com/en/docs/about-claude/models", - "models": [ + }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.057, + "output": 0.459 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.172, + "output": 1.032 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.115, + "output": 0.917 }, "type": "chat" }, { - "id": "claude-sonnet-4-0", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "qwen/qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } + }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.19, + "output": 0.37, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.56, + "output": 1.12, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "deepseek/deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.435, + "output": 0.87, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "claude-3-opus-20240229", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -64298,37 +68382,34 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "claude-fable-5", - "name": "Claude Fable 5", - "display_name": "Claude Fable 5", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -64337,295 +68418,268 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - 
"medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "claude-3-5-haiku-latest", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "minimax/minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 
4.5", - "display_name": "Claude Sonnet 4.5", + "id": "minimax/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "claude-3-5-haiku-20241022", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "minimax/minimax-m2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + 
"cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "type": "chat" + } + ] + }, + "helicone": { + "id": "helicone", + "name": "Helicone", + "display_name": "Helicone", + "api": "https://ai-gateway.helicone.ai/v1", + "doc": "https://helicone.ai/models", + "models": [ + { + "id": "chatgpt-4o-latest", + "name": "OpenAI ChatGPT-4o", + "display_name": "OpenAI ChatGPT-4o", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-08", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 5, + "output": 20, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gpt-4.1-mini-2025-04-14", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "deepseek-v3.1-terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.27, + "output": 1, + "cache_read": 0.21600000000000003 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "Claude Sonnet 3.5", - "display_name": "Claude Sonnet 3.5", + "id": "claude-3.5-haiku", + "name": 
"Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -64640,64 +68694,59 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-06-20", - "last_updated": "2024-06-20", + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.7999999999999999, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "llama-3.1-8b-instruct", + "name": "Meta Llama 3.1 8B Instruct", + "display_name": "Meta Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.02, + "output": 0.049999999999999996 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -64705,584 +68754,436 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, 
"reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "llama-prompt-guard-2-86m", + "name": "Meta Llama Prompt Guard 2 86M", + "display_name": "Meta Llama Prompt Guard 2 86M", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 512, + "output": 2 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - 
"continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "knowledge": "2025-07", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.09999999999999999, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-05", + "release_date": "2024-05-27", + "last_updated": "2024-05-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "deepseek-v3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-12", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "grok-code-fast-1", + "name": "xAI Grok Code Fast 1", + "display_name": "xAI Grok Code Fast 1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 256000, + "output": 10000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2024-08", + "release_date": "2024-08-25", + "last_updated": "2024-08-25", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.19999999999999998, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "o1-mini", + "name": "OpenAI: o1-mini", + "display_name": "OpenAI: o1-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 65536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "claude-3-sonnet-20240229", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 0.03, + "output": 0.13 }, "type": "chat" }, { - "id": "claude-opus-4-0", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - 
"mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.29, + "output": 0.59 }, "type": "chat" - } - ] - }, - "alibaba": { - "id": "alibaba", - "name": "alibaba", - "display_name": "alibaba", - "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/models", - "models": [ + }, { - "id": "qwen3-asr-flash", - "name": "Qwen3-ASR Flash", - "display_name": "Qwen3-ASR Flash", + "id": "claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 200000, + "output": 64000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the 
interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.035, - "output": 0.035 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ "text", "image", - "video", - "audio" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.4, - "output": 3.2 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "llama-4-maverick", + "name": "Meta Llama 4 Maverick 17B 128E", + "display_name": "Meta Llama 4 Maverick 17B 128E", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -65290,7 +69191,7 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 8192 }, "temperature": true, "tool_call": 
true, @@ -65298,20 +69199,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.5, - "output": 2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text", @@ -65322,29 +69223,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16400 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 2.8, - "output": 8.4 + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "llama-3.3-70b-versatile", + "name": "Meta Llama 3.3 70B Versatile", + "display_name": "Meta Llama 3.3 70B Versatile", "modalities": { "input": [ "text" @@ -65355,46 +69256,28 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32678 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - 
"last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.59, + "output": 0.7899999999999999 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "gemma2-9b-it", + "name": "Google Gemma 2", + "display_name": "Google Gemma 2", "modalities": { "input": [ "text" @@ -65404,100 +69287,98 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-25", + "last_updated": "2024-06-25", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.01, + "output": 0.03 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "gemini-2.5-pro", + "name": "Google Gemini 2.5 Pro", + "display_name": "Google Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - 
"supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.05, - "output": 0.4 + "input": 1.25, + "output": 10, + "cache_read": 0.3125, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "gpt-5", + "name": "OpenAI GPT-5", + "display_name": "OpenAI GPT-5", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65506,86 +69387,109 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 3.6 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "claude-haiku-4-5-20251001", + "name": "Anthropic: Claude 4.5 Haiku (20251001)", + "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", 
"modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen-plus-character-ja", - "name": "Qwen Plus Character (Japanese)", - "display_name": "Qwen Plus Character (Japanese)", + "id": "claude-4.5-haiku", + "name": "Anthropic: Claude 4.5 Haiku", + "display_name": "Anthropic: Claude 4.5 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 512 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -65594,182 +69498,208 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01", - "last_updated": "2024-01", + "knowledge": "2025-10", + "release_date": "2025-10-01", + "last_updated": "2025-10-01", "cost": { - "input": 0.5, - "output": 1.4 + "input": 1, + "output": 5, + "cache_read": 0.09999999999999999, + 
"cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3-livetranslate-flash-realtime", - "name": "Qwen3-LiveTranslate Flash Realtime", - "display_name": "Qwen3-LiveTranslate Flash Realtime", + "id": "gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 53248, - "output": 4096 + "context": 128000, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 10, - "output": 10, - "input_audio": 10, - "output_audio": 38 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "qwen3-235b-a22b", - "name": "Qwen3 235B A22B", - "display_name": "Qwen3 235B A22B", + "id": "gemini-2.5-flash", + "name": "Google Gemini 2.5 Flash", + "display_name": "Google Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 
24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "gpt-4o", + "name": "OpenAI GPT-4o", + "display_name": "OpenAI GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-05", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1.2, - "output": 6 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "qwen2-5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "o4-mini", + "name": "OpenAI o4 Mini", + "display_name": "OpenAI o4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false 
+ "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 1.4, - "output": 5.6 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "llama-3.1-8b-instant", + "name": "Meta Llama 3.1 8B Instant", + "display_name": "Meta Llama 3.1 8B Instant", "modalities": { "input": [ "text" @@ -65779,8 +69709,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 32678 }, "temperature": true, "tool_call": true, @@ -65788,20 +69718,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 1, - "output": 5 + "input": 0.049999999999999996, + "output": 0.08 }, "type": "chat" }, { - "id": "qwen3-14b", - "name": "Qwen3 14B", - "display_name": "Qwen3 14B", + "id": "llama-prompt-guard-2-22m", + "name": "Meta Llama Prompt Guard 2 22M", + "display_name": "Meta Llama Prompt Guard 2 22M", "modalities": { "input": [ "text" @@ -65811,64 +69741,43 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 512, + "output": 2 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.35, - "output": 1.4, - "reasoning": 4.2 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "qwen3-omni-flash", - "name": "Qwen3-Omni Flash", - "display_name": "Qwen3-Omni Flash", + "id": "o3-pro", + "name": "OpenAI o3 Pro", + "display_name": "OpenAI o3 Pro", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -65877,35 +69786,35 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.43, - "output": 1.66, - "input_audio": 3.81, - "output_audio": 15.11 + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3-VL 235B-A22B", - "display_name": "Qwen3-VL 235B-A22B", + "id": "grok-3-mini", + "name": "xAI Grok 3 Mini", + "display_name": "xAI Grok 3 Mini", "modalities": { 
"input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -65913,91 +69822,86 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "Qwen3 8B", - "display_name": "Qwen3 8B", + "id": "claude-opus-4-1-20250805", + "name": "Anthropic: Claude Opus 4.1 (20250805)", + "display_name": "Anthropic: Claude Opus 4.1 (20250805)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.18, - "output": 0.7, - "reasoning": 2.1 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "deepseek-tng-r1t2-chimera", + "name": "DeepSeek TNG R1T2 Chimera", + "display_name": "DeepSeek TNG R1T2 Chimera", "modalities": { "input": [ "text" @@ -66007,48 +69911,40 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 130000, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "knowledge": "2025-07", + "release_date": "2025-07-02", + "last_updated": "2025-07-02", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "llama-3.3-70b-instruct", + "name": "Meta Llama 3.3 70B Instruct", + "display_name": "Meta Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16400 }, "temperature": true, "tool_call": true, @@ -66057,136 +69953,85 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "knowledge": "2024-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - 
"input": 0.21, - "output": 0.63 + "input": 0.13, + "output": 0.39 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "sonar-reasoning-pro", + "name": "Perplexity Sonar Reasoning Pro", + "display_name": "Perplexity Sonar Reasoning Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3 VL Plus", - "display_name": "Qwen3 VL Plus", + "id": "grok-3", + "name": "xAI Grok 3", + "display_name": "xAI Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "glm-4.6", + "name": "Zai GLM-4.6", + "display_name": "Zai GLM-4.6", "modalities": { "input": [ "text" @@ -66196,84 +70041,91 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1.6, - "output": 6.4 + "input": 0.44999999999999996, + "output": 1.5 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 256000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "knowledge": "2025-11", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.48, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "grok-4-1-fast-non-reasoning", + "name": "xAI Grok 4.1 Fast Non-Reasoning", + "display_name": "xAI Grok 4.1 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -66281,162 +70133,160 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "qwen3-coder", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": 
true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.5, - "output": 6 + "input": 0.22, + "output": 0.95 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "gpt-5-chat-latest", + "name": "OpenAI GPT-5 Chat Latest", + "display_name": "OpenAI GPT-5 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-09", + "release_date": "2024-09-30", + "last_updated": "2024-09-30", "cost": { - "input": 0.3, - "output": 1.5 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "qwen3.5-35b-a3b", - "name": "Qwen3.5 35B-A3B", - "display_name": "Qwen3.5 35B-A3B", + "id": "gpt-5.1-codex", + "name": "OpenAI: GPT-5.1 Codex", + "display_name": "OpenAI: GPT-5.1 Codex", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { 
"supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.25, - "output": 2 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "o3-mini", + "name": "OpenAI o3 Mini", + "display_name": "OpenAI o3 Mini", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -66445,29 +70295,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-04-27", + "knowledge": "2023-10", + "release_date": "2023-10-01", + "last_updated": "2023-10-01", "cost": { - "input": 0.1875, - "output": 1.125, - "cache_write": 0.234375 + "input": 1.1, + "output": 
4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "mistral-large-2411", + "name": "Mistral-Large", + "display_name": "Mistral-Large", "modalities": { "input": [ "text" @@ -66477,108 +70331,84 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "knowledge": "2024-07", + "release_date": "2024-07-24", + "last_updated": "2024-07-24", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "gemini-2.5-flash-lite", + "name": "Google Gemini 2.5 Flash Lite", + "display_name": "Google Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65535 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": 
"tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "knowledge": "2025-07", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998, + "cache_write": 0.09999999999999999 }, "type": "chat" }, { - "id": "qwen3-vl-30b-a3b", - "name": "Qwen3-VL 30B-A3B", - "display_name": "Qwen3-VL 30B-A3B", + "id": "llama-guard-4", + "name": "Meta Llama Guard 4 12B", + "display_name": "Meta Llama Guard 4 12B", "modalities": { "input": [ "text", @@ -66590,87 +70420,85 @@ }, "limit": { "context": 131072, - "output": 32768 + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.2, - "output": 0.8, - "reasoning": 2.4 + "input": 0.21, + "output": 0.21 }, "type": "chat" }, { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "claude-opus-4-1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ "text", - "image", - "video", - "audio" + "image" ], "output": [ 
"text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": false, + "open_weights": false, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.248, - "output": 1.485 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen-vl-ocr", - "name": "Qwen Vl Ocr", - "display_name": "Qwen Vl Ocr", + "id": "claude-3.7-sonnet", + "name": "Anthropic: Claude 3.7 Sonnet", + "display_name": "Anthropic: Claude 3.7 Sonnet", "modalities": { "input": [ "text", @@ -66681,109 +70509,156 @@ ] }, "limit": { - "context": 34096, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": 
"2024-04", - "release_date": "2024-10-28", - "last_updated": "2025-04-13", + "knowledge": "2025-02", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.72, - "output": 0.72 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen2-5-omni-7b", - "name": "Qwen2.5-Omni 7B", - "display_name": "Qwen2.5-Omni 7B", + "id": "gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1 Codex Mini", + "display_name": "OpenAI: GPT-5.1 Codex Mini", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text", - "audio" + "image" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-12", - "last_updated": "2024-12", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.1, - "output": 0.4, - "input_audio": 6.76 + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "qwen-mt-turbo", - "name": "Qwen Mt Turbo", - "display_name": "Qwen Mt Turbo", + "id": "gpt-5.1-chat-latest", + "name": "OpenAI GPT-5.1 Chat", + "display_name": "OpenAI GPT-5.1 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 128000, + "output": 16384 }, 
- "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.16, - "output": 0.49 + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 }, "type": "chat" }, { - "id": "qwen2-5-32b-instruct", - "name": "Qwen2.5 32B Instruct", - "display_name": "Qwen2.5 32B Instruct", + "id": "claude-3-haiku-20240307", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -66791,31 +70666,34 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "grok-4-fast-reasoning", + "name": "xAI: Grok 4 Fast Reasoning", + "display_name": "xAI: Grok 4 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, @@ -66825,32 +70703,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "knowledge": "2025-09", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "gpt-4.1-nano", + "name": "OpenAI GPT-4.1 Nano", + "display_name": "OpenAI GPT-4.1 Nano", "modalities": { "input": [ "text", @@ -66861,8 +70732,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -66871,33 +70742,31 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0.09999999999999999, + "output": 0.39999999999999997, + "cache_read": 0.024999999999999998 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "gpt-oss-120b", + "name": "OpenAI GPT-OSS 120b", + "display_name": "OpenAI GPT-OSS 120b", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -66907,67 +70776,56 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "release_date": 
"2026-02-15", - "last_updated": "2026-02-15", + "attachment": false, + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "qwen3-omni-flash-realtime", - "name": "Qwen3-Omni Flash Realtime", - "display_name": "Qwen3-Omni Flash Realtime", + "id": "sonar", + "name": "Perplexity Sonar", + "display_name": "Perplexity Sonar", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 65536, - "output": 16384 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 0.52, - "output": 1.99, - "input_audio": 4.57, - "output_audio": 18.13 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "qwen2-5-14b-instruct", - "name": "Qwen2.5 14B Instruct", - "display_name": "Qwen2.5 14B Instruct", + "id": "qwen2.5-coder-7b-fast", + "name": "Qwen2.5 Coder 7B fast", + "display_name": "Qwen2.5 Coder 7B fast", "modalities": { "input": [ "text" @@ -66977,149 +70835,122 @@ ] }, "limit": { - "context": 131072, + "context": 32000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-09-15", + "last_updated": "2024-09-15", "cost": { - "input": 0.35, - "output": 1.4 + "input": 0.03, + "output": 0.09 }, "type": "chat" }, { - "id": 
"qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-06-02", - "last_updated": "2026-06-04", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "ernie-4.5-21b-a3b-thinking", + "name": "Baidu Ernie 4.5 21B A3B Thinking", + "display_name": "Baidu Ernie 4.5 21B A3B Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - 
"visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "attachment": false, + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.3, - "output": 2.4 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "qwen-omni-turbo-realtime", - "name": "Qwen-Omni Turbo Realtime", - "display_name": "Qwen-Omni Turbo Realtime", + "id": "llama-4-scout", + "name": "Meta Llama 4 Scout 17B 16E", + "display_name": "Meta Llama 4 Scout 17B 16E", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ - "text", - "audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -67128,21 +70959,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-08", - "last_updated": "2025-05-08", + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.27, - "output": 1.07, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen-mt-plus", - "name": "Qwen Mt Plus", - "display_name": "Qwen Mt Plus", + "id": "sonar-pro", + "name": "Perplexity Sonar Pro", + "display_name": "Perplexity Sonar Pro", "modalities": { "input": [ "text" @@ -67152,8 +70981,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -67162,19 +70991,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01", - "last_updated": "2025-01", + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 2.46, - "output": 7.37 + "input": 3, + "output": 15 }, 
"type": "chat" }, { - "id": "qvq-max", - "name": "QVQ Max", - "display_name": "QVQ Max", + "id": "gpt-4.1", + "name": "OpenAI GPT-4.1", + "display_name": "OpenAI GPT-4.1", "modalities": { "input": [ "text", @@ -67185,30 +71014,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "knowledge": "2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.2, - "output": 4.8 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "qwen2-5-vl-7b-instruct", - "name": "Qwen2.5-VL 7B Instruct", - "display_name": "Qwen2.5-VL 7B Instruct", + "id": "claude-sonnet-4-5-20250929", + "name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", "modalities": { "input": [ "text", @@ -67219,29 +71048,53 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.35, - "output": 1.05 + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -67251,19 +71104,13 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 64000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": true }, "extra_capabilities": { "reasoning": { @@ -67276,133 +71123,116 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "qwen2-5-7b-instruct", - "name": "Qwen2.5 7B Instruct", - "display_name": "Qwen2.5 7B Instruct", + "id": "grok-4-1-fast-reasoning", + "name": "xAI Grok 4.1 Fast Reasoning", + "display_name": "xAI Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 0.175, - "output": 0.7 + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 }, "type": "chat" }, { - "id": "qwen3-coder-plus-2025-09-23", - "name": "Qwen3 Coder Plus 2025 09 23", - "display_name": "Qwen3 Coder Plus 2025 09 23", + "id": "gemini-3-pro-preview", + "name": "Google Gemini 3 Pro Preview", + "display_name": "Google Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-coder-plus-2025-07-22", - "name": "Qwen3 Coder Plus 2025 07 22", - "display_name": "Qwen3 Coder Plus 2025 07 22", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1000000, - "output": 65536 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen-vl-ocr-latest", - "name": "Qwen Vl Ocr Latest", - "display_name": "Qwen Vl Ocr Latest", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 34096, - 
"output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.19999999999999998 }, - "attachment": false, "type": "chat" }, { - "id": "qvq-max-2025-05-15", - "name": "Qvq Max 2025 05 15", - "display_name": "Qvq Max 2025 05 15", + "id": "gpt-5-mini", + "name": "OpenAI GPT-5 Mini", + "display_name": "OpenAI GPT-5 Mini", "modalities": { "input": [ "text", @@ -67413,51 +71243,86 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 16384, - "min": 0, - "max": 16384 + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.024999999999999998 + }, "type": "chat" }, { - "id": "qwen-long", - "name": "Qwen Long", - "display_name": "Qwen Long", + "id": "gpt-4.1-mini", + "name": "OpenAI GPT-4.1 Mini", + "display_name": "OpenAI GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": 
"2025-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.39999999999999997, + "output": 1.5999999999999999, + "cache_read": 0.09999999999999999 + }, "type": "chat" }, { - "id": "qwen-turbo-latest", - "name": "Qwen Turbo Latest", - "display_name": "Qwen Turbo Latest", + "id": "sonar-reasoning", + "name": "Perplexity Sonar Reasoning", + "display_name": "Perplexity Sonar Reasoning", "modalities": { "input": [ "text" @@ -67467,44 +71332,30 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "cost": { + "input": 1, + "output": 5 + }, "type": "chat" }, { - "id": "qwen-turbo-2024-09-19", - "name": "Qwen Turbo 2024 09 19", - "display_name": "Qwen Turbo 2024 09 19", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ "text" @@ -67514,21 +71365,30 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 127000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-27", + "last_updated": "2025-01-27", + "cost": { + "input": 2, + "output": 
8 + }, "type": "chat" }, { - "id": "qwen-flash-2025-07-28", - "name": "Qwen Flash 2025 07 28", - "display_name": "Qwen Flash 2025 07 28", + "id": "kimi-k2-0905", + "name": "Kimi K2 (09/05)", + "display_name": "Kimi K2 (09/05)", "modalities": { "input": [ "text" @@ -67538,91 +71398,86 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.5, + "output": 2, + "cache_read": 0.39999999999999997 + }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "gpt-5-nano", + "name": "OpenAI GPT-5 Nano", + "display_name": "OpenAI GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + 
"verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.049999999999999996, + "output": 0.39999999999999997, + "cache_read": 0.005 + }, "type": "chat" }, { - "id": "qwen-plus-2024-09-19", - "name": "Qwen Plus 2024 09 19", - "display_name": "Qwen Plus 2024 09 19", + "id": "grok-4", + "name": "xAI Grok 4", + "display_name": "xAI Grok 4", "modalities": { "input": [ "text" @@ -67632,43 +71487,54 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-09", + "last_updated": "2024-07-09", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.75 + }, "type": "chat" }, { - "id": "qwen-plus-2025-07-14", - "name": "Qwen Plus 2025 07 14", - "display_name": "Qwen Plus 2025 07 14", + "id": "qwen3-235b-a22b-thinking", + "name": "Qwen3 235B A22B Thinking", + "display_name": "Qwen3 235B A22B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 81920 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "default": true }, "extra_capabilities": { "reasoning": { @@ -67681,137 +71547,162 @@ ] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - 
"search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", + "cost": { + "input": 0.3, + "output": 2.9000000000000004 + }, "type": "chat" }, { - "id": "qwen-plus-2025-09-11", - "name": "Qwen Plus 2025 09 11", - "display_name": "Qwen Plus 2025 09 11", + "id": "claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "grok-4-fast-non-reasoning", + "name": "xAI Grok 4 Fast Non-Reasoning", + "display_name": "xAI Grok 4 Fast Non-Reasoning", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", + "cost": { + "input": 0.19999999999999998, + "output": 0.5, + "cache_read": 0.049999999999999996 + }, "type": "chat" }, { - "id": "qwen-max-2024-09-19", - "name": "Qwen Max 2024 09 19", - "display_name": "Qwen Max 2024 09 19", + "id": "claude-4.5-opus", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "default": true }, "attachment": false, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", + "cost": { + "input": 5, + 
"output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-28", - "name": "Qwen Max 2024 04 28", - "display_name": "Qwen Max 2024 04 28", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -67819,12 +71710,20 @@ "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", + "cost": { + "input": 0.3, + "output": 1.5 + }, "type": "chat" }, { - "id": "qwen-max-2024-04-03", - "name": "Qwen Max 2024 04 03", - "display_name": "Qwen Max 2024 04 03", + "id": "kimi-k2-0711", + "name": "Kimi K2 (07/11)", + "display_name": "Kimi K2 (07/11)", "modalities": { "input": [ "text" @@ -67834,8 +71733,8 @@ ] }, "limit": { - "context": 8000, - "output": 2000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -67843,15 +71742,24 @@ "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.5700000000000001, + "output": 2.3 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen Max 2025 01 25", - "display_name": "Qwen Max 2025 01 25", + "id": "gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -67862,94 +71770,59 @@ "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, 
"attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.049999999999999996, + "output": 0.09999999999999999 + }, "type": "chat" }, { - "id": "qwen3-max-2025-09-23", - "name": "Qwen3 Max 20250923", - "display_name": "Qwen3 Max 20250923", + "id": "gpt-4o-mini", + "name": "OpenAI GPT-4o-mini", + "display_name": "OpenAI GPT-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" - }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "search": { - "supported": true, - "default": false, - "forced_search": false, - "search_strategy": "turbo" + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "gpt-oss-20b", + "name": "OpenAI GPT-OSS 20b", + "display_name": "OpenAI GPT-OSS 20b", "modalities": { "input": [ "text" @@ -67960,72 +71833,46 @@ }, "limit": 
{ "context": 131072, - "output": 32768 + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "type": "chat" - }, - { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "open_weights": false, + "knowledge": "2024-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 0.049999999999999996, + "output": 0.19999999999999998 }, - "attachment": false, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "claude-3.5-sonnet-v2", + "name": "Anthropic: Claude 3.5 Sonnet v2", + "display_name": "Anthropic: Claude 3.5 Sonnet v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -68033,34 +71880,39 @@ "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B 
Thinking 2507", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 41000, + "output": 41000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "supported": true }, "extra_capabilities": { "reasoning": { @@ -68074,12 +71926,20 @@ } }, "attachment": false, + "open_weights": false, + "knowledge": "2025-06", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "cost": { + "input": 0.08, + "output": 0.29 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ "text" @@ -68089,38 +71949,52 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + }, "type": "chat" }, { - "id": "qwen3-4b", - 
"name": "Qwen3 4B", - "display_name": "Qwen3 4B", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -68130,229 +72004,211 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 38912, - "min": 0, - "max": 38912 - } + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", + "cost": { + "input": 0.27, + "output": 0.41 + }, "type": "chat" }, { - "id": "qwen3-1.7b", - "name": "Qwen3 1.7B", - "display_name": "Qwen3 1.7B", + "id": "claude-4.5-sonnet", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, "attachment": false, + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.30000000000000004, + "cache_write": 3.75 + }, "type": "chat" }, { - "id": "qwen3-0.6b", - "name": "Qwen3 0.6B", - "display_name": "Qwen3 0.6B", + "id": "mistral-small", + "name": 
"Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": 30720, - "min": 0, - "max": 30720 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", + "cost": { + "input": 0.075, + "output": 0.2 + }, "type": "chat" }, { - "id": "qwen3-vl-plus-2025-09-23", - "name": "Qwen3 VL Plus 2025 09 23", - "display_name": "Qwen3 VL Plus 2025 09 23", + "id": "llama-3.1-8b-instruct-turbo", + "name": "Meta Llama 3.1 8B Instruct Turbo", + "display_name": "Meta Llama 3.1 8B Instruct Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": 81920, - "min": 0, - "max": 81920 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "knowledge": "2024-07", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.02, + "output": 0.03 + }, "type": "chat" }, { - "id": "qwq-plus-latest", - "name": "QwQ Plus Latest", - "display_name": "QwQ Plus Latest", + "id": "gpt-5.1", + "name": "OpenAI GPT-5.1", + 
"display_name": "OpenAI GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true, - "budget": { - "default": 32768, - "min": 0, - "max": 32768 - } + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "search": { - "supported": false - }, "attachment": false, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.12500000000000003 + }, "type": "chat" } ] }, - "xiaomi": { - "id": "xiaomi", - "name": "Xiaomi", - "display_name": "Xiaomi", - "api": "https://api.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", + "zai": { + "id": "zai", + "name": "Z.AI", + "display_name": "Z.AI", + "api": "https://api.z.ai/api/paas/v4", + "doc": "https://docs.z.ai/guides/overview/pricing", "models": [ { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 204800, "output": 131072 }, "temperature": true, @@ -68372,33 +72228,36 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - 
"release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2.5-pro-ultraspeed", - "name": "MiMo-V2.5-Pro-UltraSpeed", - "display_name": "MiMo-V2.5-Pro-UltraSpeed", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -68406,33 +72265,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-06-08", - "last_updated": "2026-06-09", + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 1.305, - "output": 2.61, - "cache_read": 0.0108 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -68442,8 +72289,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -68451,113 +72298,58 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, 
"attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 200000, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "tiers": [ - { - "input": 0.8, - "output": 4, - "cache_read": 0.16, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "glm-5.1", + "name": 
"GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -68567,8 +72359,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -68588,21 +72380,21 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -68612,7 +72404,7 @@ ] }, "limit": { - "context": 1048576, + "context": 204800, "output": 131072 }, "temperature": true, @@ -68623,153 +72415,144 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "mistral": { - "id": "mistral", - "name": "Mistral", - "display_name": "Mistral", - "doc": "https://docs.mistral.ai/getting-started/models/", - "models": [ + }, { - "id": "mistral-large-2411", - 
"name": "Mistral Large 2.1", - "display_name": "Mistral Large 2.1", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 2, - "output": 6 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "mistral-medium-2508", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.4, - "output": 2 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" }, { - "id": "mistral-medium-latest", - "name": "Mistral Medium (latest)", - "display_name": "Mistral Medium (latest)", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": 
"GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.4, - "output": 2 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, { - "id": "devstral-medium-latest", - "name": "Devstral 2 (latest)", - "display_name": "Devstral 2 (latest)", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -68779,41 +72562,48 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 98304 }, "temperature": true, 
"tool_call": true, @@ -68821,33 +72611,34 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mistral-medium-2604", - "name": "Mistral Medium 3.5", - "display_name": "Mistral Medium 3.5", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -68855,20 +72646,33 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.5, - "output": 7.5 + "input": 1, + "output": 3.2, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ "text" @@ -68878,60 +72682,95 @@ ] }, "limit": { - "context": 8000, - "output": 3072 + "context": 200000, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.1, - "output": 0 + "input": 1.2, + "output": 4, + "cache_read": 0.24, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "nearai": { + "id": "nearai", + "name": "NEAR AI Cloud", + "display_name": "NEAR AI Cloud", + "api": "https://cloud-api.near.ai/v1", + "doc": "https://docs.near.ai/", + "models": [ { - "id": "ministral-8b-latest", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text" @@ -68941,193 +72780,333 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 
32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.13, + "output": 0.4, + "cache_read": 0.026 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "open-mistral-7b", - "name": "Mistral 7B", - "display_name": "Mistral 7B", + "id": 
"google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2023-09-27", - "last_updated": "2023-09-27", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.25, - "output": 0.25 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "labs-devstral-small-2512", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "google/gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + 
"medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0, - "output": 0 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "google/gemini-3-pro", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.25, + "output": 15, + "cache_read": 0 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + 
"output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.4, - "output": 2 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "Qwen/Qwen3-Embedding-0.6B", + "name": "Qwen3 Embedding 0.6B", + "display_name": "Qwen3 Embedding 0.6B", "modalities": { "input": [ "text" @@ -69137,30 +73116,59 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 40960, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "devstral-latest", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "Qwen/Qwen3-Reranker-0.6B", + "name": "Qwen3 Reranker 0.6B", + "display_name": "Qwen3 Reranker 0.6B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 40960, + "output": 1024 + }, + 
"temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-03", + "last_updated": "2025-06-03", + "cost": { + "input": 0.01, + "output": 0.01 + }, + "type": "rerank" + }, + { + "id": "Qwen/Qwen3.6-35B-A3B-FP8", + "name": "Qwen 3.6 35B A3B FP8", + "display_name": "Qwen 3.6 35B A3B FP8", "modalities": { "input": [ "text" @@ -69171,28 +73179,40 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.4, - "output": 2 + "input": 0.17, + "output": 1.1, + "cache_read": 0.056 }, "type": "chat" }, { - "id": "open-mixtral-8x22b", - "name": "Mixtral 8x22B", - "display_name": "Mixtral 8x22B", + "id": "Qwen/Qwen3.5-122B-A10B", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text" @@ -69202,41 +73222,51 @@ ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + 
"release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 2, - "output": 6 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B-A3B Instruct 2507", + "display_name": "Qwen3 30B-A3B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -69245,19 +73275,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3-VL 30B-A3B Instruct", + "display_name": "Qwen3-VL 30B-A3B Instruct", "modalities": { "input": [ "text", @@ -69268,8 +73297,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -69278,115 +73307,173 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { "input": 0.15, - "output": 0.15 + "output": 0.55 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - 
"temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.1, - "output": 0.3 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 2 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "codestral-latest", - "name": "Codestral 
(latest)", - "display_name": "Codestral (latest)", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", @@ -69397,29 +73484,53 @@ ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": 
"2024-11-04", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2, - "output": 6 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "open-mistral-nemo", - "name": "Open Mistral Nemo", - "display_name": "Open Mistral Nemo", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -69429,93 +73540,136 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.15, - "output": 0.15 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "ministral-3b-latest", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.04, - "output": 0.04 + "input": 1.8, + "output": 15.5, + "cache_read": 0.18 }, "type": "chat" }, { - "id": "devstral-small-2505", - "name": "Devstral Small 2505", - "display_name": "Devstral Small 2505", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0.1, - "output": 0.3 + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "open-mixtral-8x7b", - "name": "Mixtral 8x7B", - "display_name": "Mixtral 8x7B", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ "text" @@ -69525,62 +73679,108 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-01", - "release_date": "2023-12-11", 
- "last_updated": "2023-12-11", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.7, - "output": 0.7 + "input": 0.15, + "output": 0.55 }, "type": "chat" }, { - "id": "magistral-medium-latest", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 2, - "output": 5 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "mistral-small-latest", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -69591,69 +73791,86 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 400000, + 
"output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "devstral-medium-2507", - "name": "Devstral Medium", - "display_name": "Devstral Medium", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.4, - "output": 2 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" - } - ] - }, - "vivgrid": { - "id": "vivgrid", - "name": "Vivgrid", - "display_name": "Vivgrid", - "api": "https://api.vivgrid.com/v1", - "doc": "https://docs.vivgrid.com/models", - "models": [ + }, { - "id": "gpt-5-mini", + "id": "openai/gpt-5-mini", "name": "GPT-5 Mini", "display_name": "GPT-5 Mini", "modalities": 
{ @@ -69666,7 +73883,7 @@ ] }, "limit": { - "context": 272000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -69704,20 +73921,18 @@ "cost": { "input": 0.25, "output": 2, - "cache_read": 0.03 + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -69725,50 +73940,44 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -69776,29 +73985,76 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + 
"low", + "medium", + "high" + ], + "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 + }, + "type": "chat" + }, + { + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", + "modalities": { + "input": [ + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 448, + "output": 448 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0.28, - "output": 0.42 + "input": 0.01, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -69824,8 +74080,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -69838,18 +74093,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-5.5", + "id": "openai/gpt-5.5", "name": "GPT-5.5", "display_name": "GPT-5.5", "modalities": { @@ -69922,23 +74177,24 @@ "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 
(latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -69948,39 +74204,40 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3, + "output": 15.5, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -69992,7 +74249,7 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -70006,45 +74263,48 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -70052,247 +74312,280 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 200000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1 FP8", + "display_name": "GLM-5.1 FP8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "black-forest-labs/FLUX.2-klein-4B", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, + "context": 
128000, "output": 128000 }, - "temperature": false, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", + "cost": { + "input": 1, + "output": 1 + }, + "type": "chat" + } + ] + }, + "llmgateway": { + "id": "llmgateway", + "name": "LLM Gateway", + "display_name": "LLM Gateway", + "api": "https://api.llmgateway.io/v1", + "doc": "https://llmgateway.io/docs", + "models": [ + { + "id": "claude-3-7-sonnet", + "name": "Claude 3.7 Sonnet", + "display_name": "Claude 3.7 Sonnet", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 8192 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -70302,40 +74595,37 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic uses thinking budget tokens" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "qwen-coder-plus", + "name": "Qwen Coder Plus", + "display_name": "Qwen Coder Plus", "modalities": { "input": [ "text" @@ -70345,179 +74635,180 
@@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "cost": { + "input": 0.502, + "output": 1.004 + }, + "type": "chat" + }, + { + "id": "mistral-large-latest", + "name": "Mistral Large (latest)", + "display_name": "Mistral Large (latest)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.5, + "output": 1.5 }, "type": "chat" - } - ] - }, - "databricks": { - "id": "databricks", - "name": "Databricks", - "display_name": "Databricks", - "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", - "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", - "models": [ + }, { - "id": "databricks-claude-sonnet-4", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "databricks-gpt-5-1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "deepseek-r1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 64000, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": 
"databricks-gpt-5-4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "devstral-small-2507", + "name": "Devstral Small", + "display_name": "Devstral Small", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "databricks-gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "qwen3-vl-30b-a3b-thinking", + "name": "Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ "text", @@ -70528,73 +74819,88 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.2, + "output": 1 }, "type": "chat" }, { - "id": "databricks-gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": 
"deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" @@ -70607,226 +74913,141 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 1, + 
"output": 5 }, "type": "chat" }, { - "id": "databricks-gpt-5-4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "qwen25-coder-7b", + "name": "Qwen2.5 Coder 7B", + "display_name": "Qwen2.5 Coder 7B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower 
effort levels should be chosen per workload." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "databricks-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "databricks-gpt-5-2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "databricks-gemini-2-5-flash", - "name": "Gemini 2.5 Flash", - 
"display_name": "Gemini 2.5 Flash", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -70834,23 +75055,33 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -70862,58 +75093,45 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 
4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "databricks-gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -70923,8 +75141,8 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -70932,26 +75150,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.05, - "output": 0.2 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "databricks-gemini-3-flash", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "grok-4-20-beta-0309-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -70959,100 +75182,97 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": 
false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "databricks-claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "databricks-gpt-5-4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -71060,47 +75280,37 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "databricks-gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct (2507)", + "display_name": "Qwen3 235B A22B Instruct (2507)", "modalities": { "input": [ "text" @@ -71111,147 +75321,102 @@ }, "limit": { "context": 131072, - 
"output": 32768 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.072, - "output": 0.28 + "input": 0.09, + "output": 0.58 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "llama-3-70b-instruct", + "name": "Llama 3 70B Instruct", + "display_name": "Llama 3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 8192, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "databricks-gemini-3-1-flash-lite", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "databricks-gemini-3-pro", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "seed-1-8-251228", + "name": "Seed 1.8 (251228)", + "display_name": "Seed 1.8 (251228)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -71260,326 +75425,283 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": 
"2025-11-18", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2025-12-18", + "last_updated": "2025-12-18", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } + "input": 0.25, + "output": 2, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "hermes-2-pro-llama-3-8b", + "name": "Hermes 2 Pro Llama 3 8B", + "display_name": "Hermes 2 Pro Llama 3 8B", + "modalities": { + "input": [ + "text" ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-05-27", + "last_updated": "2024-05-27", + "cost": { + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "databricks-claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "attachment": false, + "open_weights": true, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", + "cost": { + "input": 0.6, + "output": 2.5, + "cache_read": 0.12 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "type": "chat" + }, + { + "id": "llama-3.1-70b-instruct", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "databricks-claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gpt-5.2-pro", + "name": "GPT-5.2 Pro", + "display_name": "GPT-5.2 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires 
the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "databricks-gpt-5-5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "minimax-m2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", - "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 + "extra_capabilities": { + "reasoning": { + "supported": true } }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" }, { - "id": "databricks-claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "databricks-gemini-3-1-pro", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "pixtral-large-latest", + "name": "Pixtral Large (latest)", + "display_name": "Pixtral Large (latest)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, - "limit": { - "context": 1048576, - "output": 65536 + "limit": { + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2024-11-04", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ 
- { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "output": 6 }, "type": "chat" - } - ] - }, - "siliconflow": { - "id": "siliconflow", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.cn/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ + }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "glm-4-32b-0414-128k", + "name": "GLM-4 32B (0414-128k)", + "display_name": "GLM-4 32B (0414-128k)", "modalities": { "input": [ "text" @@ -71589,8 +75711,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -71599,49 +75721,52 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "seed-1-6-flash-250715", + "name": "Seed 1.6 Flash (250715)", + "display_name": "Seed 1.6 Flash (250715)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 256000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.07, + "output": 0.3, + "cache_read": 0.015 }, "type": "chat" 
}, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next 80B-A3B Instruct", + "display_name": "Qwen3-Next 80B-A3B Instruct", "modalities": { "input": [ "text" @@ -71652,7 +75777,7 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -71660,22 +75785,24 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 0.086, - "output": 0.086 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", + "id": "qwen3-vl-8b-instruct", + "name": "Qwen3 VL 8B Instruct", + "display_name": "Qwen3 VL 8B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -71686,159 +75813,205 @@ "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.08, + "output": 0.5 }, "type": "chat" }, { - "id": "inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "gpt-4o-mini-search-preview", + "name": "GPT-4o Mini Search Preview", + "display_name": "GPT-4o Mini Search Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "glm-4.5v", + "name": "GLM-4.5V", + "display_name": "GLM-4.5V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 64000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.6, + "output": 1.8 }, "type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": 
"2025-11-25", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.4, + "output": 1.6, + "cache_read": 0.08, + "cache_write": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.5, - "output": 1.9 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -71849,60 +76022,110 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": 
false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 0.9 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.14, - "output": 0.86 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -71912,39 +76135,56 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.14, - "output": 0.86 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -71963,20 +76203,20 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "attachment": 
true, + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -71986,44 +76226,81 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.5, + "output": 1.5, + "cache_read": 0 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "seed-1-6-250615", + "name": "Seed 1.6 (250615)", + "display_name": "Seed 1.6 (250615)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 256000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + 
"reasoning": { + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -72032,18 +76309,20 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.21, - "output": 0.57 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -72054,38 +76333,95 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "deepseek-ai/DeepSeek-V4-Pro", - "display_name": "deepseek-ai/DeepSeek-V4-Pro", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 272000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + 
"knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 15, + "output": 120 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1049000, - "output": 393000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72096,31 +76432,78 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-OCR", - "name": "deepseek-ai/DeepSeek-OCR", - "display_name": "deepseek-ai/DeepSeek-OCR", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, + { + "id": "ministral-8b-2512", + "name": 
"Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ + "text", "image" ], "output": [ @@ -72128,7 +76511,7 @@ ] }, "limit": { - "context": 8192, + "context": 262144, "output": 8192 }, "temperature": true, @@ -72138,17 +76521,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-10-20", - "last_updated": "2025-10-20", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0 - } + "input": 0.15, + "output": 0.15 + }, + "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ "text" @@ -72158,7 +76542,7 @@ ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, "temperature": true, @@ -72166,52 +76550,70 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.25, - "output": 1 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + 
"visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.1, - "output": 0.1 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ "text" @@ -72221,14 +76623,13 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -72243,61 +76644,67 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.5, - "output": 2.18 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "mistral-small-2506", + "name": "Mistral Small 3.2", + "display_name": "Mistral Small 3.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.18, - 
"output": 0.18 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -72307,26 +76714,44 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0.27, - "output": 0.42 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -72339,86 +76764,142 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", 
- "last_updated": "2025-11-25", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.27, - "output": 1 + "input": 0.115, + "output": 0.287 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.15, - "output": 0.15 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL-1.5", - "name": "PaddlePaddle/PaddleOCR-VL-1.5", - "display_name": "PaddlePaddle/PaddleOCR-VL-1.5", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "open_weights": false, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "PaddlePaddle/PaddleOCR-VL", - "name": "PaddlePaddle/PaddleOCR-VL", - "display_name": "PaddlePaddle/PaddleOCR-VL", + "id": "llama-4-scout-17b-instruct", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", "modalities": { "input": [ "text", @@ -72429,8 +76910,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 8192, + "output": 2048 }, "temperature": true, "tool_call": false, @@ -72439,49 +76920,18 @@ }, "attachment": true, "open_weights": true, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", - "cost": { 
- "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "Kwaipilot/KAT-Dev", - "name": "Kwaipilot/KAT-Dev", - "display_name": "Kwaipilot/KAT-Dev", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-27", - "last_updated": "2026-01-16", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -72491,70 +76941,77 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "ascend-tribe/pangu-pro-moe", - "name": "ascend-tribe/pangu-pro-moe", - "display_name": "ascend-tribe/pangu-pro-moe", + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2026-01-16", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.2, - "output": 0.6 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": "gemini-2.0-flash", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 8192 }, "temperature": true, @@ -72562,51 +77019,77 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "grok-4-20-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "release_date": "2026-03-09", + "last_updated": 
"2026-03-09", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "Pro/MiniMaxAI/MiniMax-M2.5", - "name": "Pro/MiniMaxAI/MiniMax-M2.5", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.5", + "id": "glm-4.7-flashx", + "name": "GLM-4.7-FlashX", + "display_name": "GLM-4.7-FlashX", "modalities": { "input": [ "text" @@ -72616,39 +77099,32 @@ ] }, "limit": { - "context": 192000, - "output": 131000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.3, - "output": 1.22 + "input": 0.07, + "output": 0.4, + "cache_read": 0.01, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/MiniMaxAI/MiniMax-M2.1", - "name": "Pro/MiniMaxAI/MiniMax-M2.1", - "display_name": "Pro/MiniMaxAI/MiniMax-M2.1", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct (2507)", + "display_name": "Qwen3 30B A3B Instruct (2507)", "modalities": { "input": [ "text" @@ -72658,33 +77134,28 @@ ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": 
false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-4.7", - "name": "Pro/zai-org/GLM-4.7", - "display_name": "Pro/zai-org/GLM-4.7", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -72694,8 +77165,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -72715,19 +77186,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.6, - "output": 2.2 + "input": 6, + "output": 24, + "cache_read": 1.3, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5", - "name": "Pro/zai-org/GLM-5", - "display_name": "Pro/zai-org/GLM-5", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -72737,8 +77210,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -72759,18 +77232,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 3.2 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "Pro/zai-org/GLM-5.1", - "name": "Pro/zai-org/GLM-5.1", - "display_name": "Pro/zai-org/GLM-5.1", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3-Next 80B-A3B (Thinking)", + "display_name": "Qwen3-Next 80B-A3B (Thinking)", 
"modalities": { "input": [ "text" @@ -72780,8 +77255,8 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -72802,31 +77277,30 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 0.5, + "output": 6 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2.6", - "name": "Pro/moonshotai/Kimi-K2.6", - "display_name": "Pro/moonshotai/Kimi-K2.6", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -72836,73 +77310,72 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.6, + "output": 2.2, + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "name": "Pro/moonshotai/Kimi-K2-Instruct-0905", - "display_name": "Pro/moonshotai/Kimi-K2-Instruct-0905", + "id": "qwen35-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.4, - "output": 2 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2.5", - "name": "Pro/moonshotai/Kimi-K2.5", - "display_name": "Pro/moonshotai/Kimi-K2.5", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking (2507)", + "display_name": "Qwen3 235B A22B Thinking (2507)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -72923,18 +77396,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "Pro/moonshotai/Kimi-K2-Thinking", - "name": "Pro/moonshotai/Kimi-K2-Thinking", - "display_name": "Pro/moonshotai/Kimi-K2-Thinking", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -72944,8 +77417,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -72965,62 +77438,91 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.55, - "output": 2.5 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - 
"id": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, + "knowledge": "2025-07-31", "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "last_updated": "2025-09-29", "cost": { - "input": 0.27, - "output": 1 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3.2", - "name": "Pro/deepseek-ai/DeepSeek-V3.2", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2", + "id": "gemini-pro-latest", + "name": "Gemini Pro Latest", + "display_name": "Gemini Pro Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -73028,25 +77530,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", "cost": { - "input": 0.27, - "output": 0.42 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1", - "name": "Pro/deepseek-ai/DeepSeek-R1", - "display_name": "Pro/deepseek-ai/DeepSeek-R1", + "id": "gemma-3-1b-it", + "name": "Gemma 3 1B IT", + "display_name": "Gemma 3 1B IT", "modalities": { "input": [ "text" @@ -73056,40 +77554,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", 
- "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.08, + "output": 0.3 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-V3", - "name": "Pro/deepseek-ai/DeepSeek-V3", - "display_name": "Pro/deepseek-ai/DeepSeek-V3", + "id": "glm-4.5-x", + "name": "GLM-4.5 X", + "display_name": "GLM-4.5 X", "modalities": { "input": [ "text" @@ -73099,133 +77585,163 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.25, - "output": 1 + "input": 2.2, + "output": 8.9, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen/Qwen3.6-35B-A3B", - "display_name": "Qwen/Qwen3.6-35B-A3B", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens 
requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.23, - "output": 1.86 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen/Qwen3.5-35B-A3B", - "display_name": "Qwen/Qwen3.5-35B-A3B", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.23, - "output": 1.86 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": 
"Qwen/Qwen3.5-397B-A17B", - "display_name": "Qwen/Qwen3.5-397B-A17B", + "id": "grok-4-20-beta-0309-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -73233,258 +77749,216 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-09", + "last_updated": "2026-03-09", "cost": { - "input": 0.29, - "output": 1.74 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2, + "tiers": [ + { + "input": 2.5, + "output": 5, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 5, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-9B", - "name": "Qwen/Qwen3.5-9B", - "display_name": "Qwen/Qwen3.5-9B", + "id": "glm-4.5-airx", + "name": "GLM-4.5 AirX", + "display_name": "GLM-4.5 AirX", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - 
"release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.22, - "output": 1.74 + "input": 1.1, + "output": 4.5, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-4B", - "name": "Qwen/Qwen3.5-4B", - "display_name": "Qwen/Qwen3.5-4B", + "id": "gpt-5-chat-latest", + "name": "GPT-5 Chat (latest)", + "display_name": "GPT-5 Chat (latest)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-122B-A10B", - "name": "Qwen/Qwen3.5-122B-A10B", - "display_name": "Qwen/Qwen3.5-122B-A10B", + "id": "ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.29, - "output": 2.32 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-27B", - "name": "Qwen/Qwen3.5-27B", - "display_name": "Qwen/Qwen3.5-27B", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-25", - "last_updated": "2026-02-25", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.26, - "output": 2.09 + "input": 2.8, + "output": 8.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "glm-4.6v-flashx", + "name": "GLM-4.6V FlashX", + "display_name": "GLM-4.6V FlashX", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": 
"2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.04, + "output": 0.4, + "cache_read": 0.004 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "minimax-m3", + "name": "MiniMax-M3", + "display_name": "MiniMax-M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 512000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -73494,71 +77968,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", - "cost": { - "input": 0.14, - "output": 0.57 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL Plus", + "display_name": "Qwen3-VL Plus", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -73577,94 +78016,142 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-11-25", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.29, - "output": 1 + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.09, - "output": 0.3 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.18, - "output": 0.18 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "minimax-m2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -73674,49 +78161,46 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": 
true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, @@ -73726,172 +78210,220 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.27, - "output": 0.27 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + 
"effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.59, - "output": 0.59 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", - "cost": { - "input": 0.18, - "output": 0.18 - } - }, - { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + 
"mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.29, - "output": 1 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max (2026-01-23)", + "display_name": "Qwen3 Max (2026-01-23)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 32800 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.359, + "output": 1.434, + "cache_read": 0.072 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat (latest)", + 
"display_name": "GPT-5.3 Chat (latest)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.14, - "output": 1.4 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "claude-3-opus", + "name": "Claude 3 Opus", + "display_name": "Claude 3 Opus", "modalities": { "input": [ "text", @@ -73902,8 +78434,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -73912,29 +78444,34 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.2, - "output": 0.6 + "input": 15, + "output": 75, + "cache_read": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -73943,18 +78480,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", 
+ "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 0.09, - "output": 0.6 + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ "text" @@ -73964,10 +78504,10 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -73976,28 +78516,33 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "qwen3-32b-fp8", + "name": "Qwen3 32B FP8", + "display_name": "Qwen3 32B FP8", "modalities": { "input": [ "text" @@ -74013,21 +78558,23 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": 
"2025-04-28", "cost": { - "input": 0.07, - "output": 0.28 - } + "input": 0.1, + "output": 0.1 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "claude-3-5-haiku", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text" @@ -74037,127 +78584,133 @@ ] }, "limit": { - "context": 131072, + "context": 200000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.8, + "output": 4, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": 
"hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.06, - "output": 0.06 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "gemma-3-27b", + "name": "Gemma 3 27B", + "display_name": "Gemma 3 27B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -74166,28 +78719,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + 
"xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.2, - "output": 1.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "grok-4-0709", + "name": "Grok 4 (0709)", + "display_name": "Grok 4 (0709)", "modalities": { "input": [ "text" @@ -74197,39 +78762,28 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.07, - "output": 0.28 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -74239,28 +78793,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + 
"thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.09, - "output": 0.3 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "qwen-flash", + "name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ "text" @@ -74270,28 +78838,41 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.1, + "input": 0.05, "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "qwen3-4b-fp8", + "name": "Qwen3 4B FP8", + "display_name": "Qwen3 4B FP8", "modalities": { "input": [ "text" @@ -74307,67 +78888,85 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.59, - "output": 0.59 + "input": 
0.03, + "output": 0.03 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.15, - "output": 0.58 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "qwen2-5-vl-32b-instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -74383,63 +78982,77 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-03-15", + "last_updated": "2025-03-15", "cost": { - "input": 0.1, - "output": 0.4 + "input": 1.4, + "output": 4.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - 
"name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.18, - "output": 2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex mini", + "display_name": "GPT-5.1 Codex mini", "modalities": { "input": [ "text", @@ -74450,28 +79063,52 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", 
+ "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.18, - "output": 0.68 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking (2507)", + "display_name": "Qwen3 30B A3B Thinking (2507)", "modalities": { "input": [ "text" @@ -74487,34 +79124,49 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "open_weights": true, + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 0.25, - "output": 1 - } + "input": 0.1, + "output": 0.1 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -74531,92 +79183,91 @@ ] } }, - "attachment": true, - "open_weights": 
false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.45, - "output": 3.5 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "seed-1-6-250915", + "name": "Seed 1.6 (250915)", + "display_name": "Seed 1.6 (250915)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 256000, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "Pro/deepseek-ai/DeepSeek-V3.2-Exp", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "supported": true, + "default": true }, - "tool_call": true, - "reasoning": { - "supported": false + "attachment": true, + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "inclusionAI/Ring-1T", - "name": "inclusionAI/Ring-1T", - "display_name": "inclusionAI/Ring-1T", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + 
"release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "inclusionAI/Ling-1T", - "name": "inclusionAI/Ling-1T", - "display_name": "inclusionAI/Ling-1T", + "id": "minimax-text-01", + "name": "MiniMax Text 01", + "display_name": "MiniMax Text 01", "modalities": { "input": [ "text" @@ -74626,171 +79277,143 @@ ] }, "limit": { - "context": 131072, - "output": 8192 - }, - "tool_call": true, - "reasoning": { - "supported": false - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen-Image-Edit-2509", - "name": "Qwen/Qwen-Image-Edit-2509", - "display_name": "Qwen/Qwen-Image-Edit-2509", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "image" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image-Edit", - "name": "Qwen/Qwen-Image-Edit", - "display_name": "Qwen/Qwen-Image-Edit", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "image" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Qwen/Qwen-Image", - "name": "Qwen/Qwen-Image", - "display_name": "Qwen/Qwen-Image", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] + "context": 1000000, + "output": 131072 }, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-I2V-A14B", - "name": "Wan-AI/Wan2.2-I2V-A14B", - "display_name": "Wan-AI/Wan2.2-I2V-A14B", - "modalities": { - "input": [ - "image", - "text" - ], - "output": [ - "video" - ] + "supported": true, + "default": true }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "Wan-AI/Wan2.2-T2V-A14B", - "name": "Wan-AI/Wan2.2-T2V-A14B", - "display_name": "Wan-AI/Wan2.2-T2V-A14B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "video" - ] + "attachment": false, + "open_weights": true, + "release_date": "2025-01-15", + 
"last_updated": "2025-01-15", + "cost": { + "input": 0.2, + "output": 1.1 }, - "tool_call": false, - "reasoning": { - "supported": false - } + "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast Reasoning", + "display_name": "Grok 4 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "stepfun-ai/step3", - "name": "stepfun-ai/step3", - "display_name": "stepfun-ai/step3", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "TeleAI/TeleSpeechASR", - "name": "TeleAI/TeleSpeechASR", - "display_name": "TeleAI/TeleSpeechASR", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 32766 + }, + "temperature": true, + "tool_call": true, "reasoning": 
{ - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.05, + "output": 0.25 + }, + "type": "chat" }, { - "id": "THUDM/GLM-4.1V-9B-Thinking", - "name": "THUDM/GLM-4.1V-9B-Thinking", - "display_name": "THUDM/GLM-4.1V-9B-Thinking", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -74800,17 +79423,26 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", + "cost": { + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "name": "Pro/THUDM/GLM-4.1V-9B-Thinking", - "display_name": "Pro/THUDM/GLM-4.1V-9B-Thinking", + "id": "llama-3-8b-instruct", + "name": "Llama 3 8B Instruct", + "display_name": "Llama 3 8B Instruct", "modalities": { "input": [ "text" @@ -74820,20 +79452,28 @@ ] }, "limit": { - "context": 131072, + "context": 8192, "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-03", + "last_updated": "2025-04-03", + "cost": { + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "moonshotai/Kimi-Dev-72B", - "name": "moonshotai/Kimi-Dev-72B", - "display_name": "moonshotai/Kimi-Dev-72B", + "id": "qwen3-30b-a3b-fp8", + "name": "Qwen3 30B A3B FP8", + "display_name": "Qwen3 30B A3B FP8", "modalities": { "input": [ "text" @@ -74846,16 +79486,26 @@ "context": 
131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "cost": { + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M1-80k", - "name": "MiniMaxAI/MiniMax-M1-80k", - "display_name": "MiniMaxAI/MiniMax-M1-80k", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -74865,19 +79515,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 1, + "output": 1 + }, "type": "chat" }, { - "id": "Tongyi-Zhiwen/QwenLong-L1-32B", - "name": "Tongyi-Zhiwen/QwenLong-L1-32B", - "display_name": "Tongyi-Zhiwen/QwenLong-L1-32B", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -74887,241 +79547,398 @@ ] }, "limit": { - "context": 131072, + "context": 32768, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", + "cost": { + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - "display_name": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] 
}, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B", - "name": "Qwen/Qwen3-30B-A3B", - "display_name": "Qwen/Qwen3-30B-A3B", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-8B", - "name": "Qwen/Qwen3-Reranker-8B", - "display_name": "Qwen/Qwen3-Reranker-8B", + "id": "minimax-m2.5-highspeed", + "name": 
"MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "rerank" + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen/Qwen3-Embedding-8B", - "display_name": "Qwen/Qwen3-Embedding-8B", + "id": "deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": true, + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.07 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-4B", - "name": "Qwen/Qwen3-Reranker-4B", - "display_name": "Qwen/Qwen3-Reranker-4B", + "id": "llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 32768, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + 
"release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.18, + "output": 0.59 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen/Qwen3-Embedding-4B", - "display_name": "Qwen/Qwen3-Embedding-4B", + "id": "ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": true, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-0.6B", - "name": "Qwen/Qwen3-Reranker-0.6B", - "display_name": "Qwen/Qwen3-Reranker-0.6B", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 200000, + "output": 8192 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-0.6B", - "name": "Qwen/Qwen3-Embedding-0.6B", - "display_name": "Qwen/Qwen3-Embedding-0.6B", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 128000, + "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": true }, - "type": "embedding" + "attachment": true, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0.3, + "output": 0.9 + }, + "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 + }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-VL-7B-Instruct", + "id": "minimax-m2.1-lightning", + "name": "MiniMax M2.1 Lightning", + "display_name": "MiniMax M2.1 Lightning", "modalities": { "input": [ "text" @@ -75131,259 +79948,539 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 196608, + "output": 131072 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.12, + "output": 0.48 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1050000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": 
"2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "Qwen/QVQ-72B-Preview", - "name": "Qwen/QVQ-72B-Preview", - "display_name": "Qwen/QVQ-72B-Preview", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } + }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": 
"2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "fnlp/MOSS-TTSD-v0.5", - "name": "fnlp/MOSS-TTSD-v0.5", - "display_name": "fnlp/MOSS-TTSD-v0.5", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" - ] - }, - "tool_call": false, - "reasoning": { - "supported": false - } - }, - { - "id": "FunAudioLLM/CosyVoice2-0.5B", - "name": "FunAudioLLM/CosyVoice2-0.5B", - "display_name": "FunAudioLLM/CosyVoice2-0.5B", - "modalities": { - "input": [ "text" - ], - "output": [ - "audio" ] }, - "tool_call": false, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 + }, + "type": "chat" }, { - "id": "FunAudioLLM/SenseVoiceSmall", - "name": "FunAudioLLM/SenseVoiceSmall", - "display_name": "FunAudioLLM/SenseVoiceSmall", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "audio" + "text", + "image", + "video" ], "output": [ "text" ] }, - "tool_call": false, + "limit": { + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4, + "cache_read": 0.16 + }, + "type": "chat" }, { - "id": "IndexTeam/IndexTTS-2", - "name": "IndexTeam/IndexTTS-2", - "display_name": "IndexTeam/IndexTTS-2", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "audio" + "text" ] }, - "tool_call": false, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 2, + "output": 8, + "cache_read": 0.5 + }, + "type": "chat" }, { - "id": "BAAI/bge-m3", - "name": "BAAI/bge-m3", - "display_name": "BAAI/bge-m3", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": 
"2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, + "type": "chat" }, { - "id": "BAAI/bge-reranker-v2-m3", - "name": "BAAI/bge-reranker-v2-m3", - "display_name": "BAAI/bge-reranker-v2-m3", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "score" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "type": "rerank" + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, + "type": "chat" }, { - "id": "netease-youdao/bce-embedding-base_v1", - "name": "netease-youdao/bce-embedding-base_v1", - "display_name": "netease-youdao/bce-embedding-base_v1", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" ], "output": [ - "embedding" + "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "type": "embedding" + "attachment": false, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", + "cost": { + "input": 0.108, + "output": 0.675 + }, + "type": "chat" }, { - "id": "netease-youdao/bce-reranker-base_v1", - "name": "netease-youdao/bce-reranker-base_v1", - "display_name": "netease-youdao/bce-reranker-base_v1", + "id": "llama-4-maverick-17b-instruct", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "score" + "text" ] }, "limit": { "context": 8192, "output": 2048 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false - } - }, - { - "id": "Kwai-Kolors/Kolors", - "name": "Kwai-Kolors/Kolors", - "display_name": "Kwai-Kolors/Kolors", - "modalities": { - "input": [ - "text" - ], - "output": [ - "image" - ] }, - "tool_call": false, - "reasoning": { - "supported": false - } + "attachment": true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.24, + "output": 0.97 + }, + "type": "chat" }, { - "id": 
"Qwen/Qwen2-VL-72B-Instruct", - "name": "Qwen/Qwen2-VL-72B-Instruct", - "display_name": "Qwen/Qwen2-VL-72B-Instruct", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -75393,19 +80490,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 1.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "devstral-2512", + "name": "Devstral 2", + "display_name": "Devstral 2", "modalities": { "input": [ "text" @@ -75415,40 +80522,87 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" }, { - "id": "internlm/internlm2_5-7b-chat", - "name": "internlm/internlm2_5-7b-chat", - "display_name": "internlm/internlm2_5-7b-chat", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + 
"mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ "text" @@ -75461,41 +80615,81 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", + "cost": { + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "THUDM/glm-4-9b-chat", - "name": "THUDM/glm-4-9b-chat", - "display_name": "THUDM/glm-4-9b-chat", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast Reasoning", + "display_name": "Grok 4.1 Fast Reasoning", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "BAAI/bge-large-en-v1.5", - "name": "BAAI/bge-large-en-v1.5", - "display_name": "BAAI/bge-large-en-v1.5", + "id": "qwen3-vl-30b-a3b-instruct", + "name": "Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -75505,60 +80699,125 @@ "context": 131072, "output": 8192 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": true, + "open_weights": true, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", + "cost": { + "input": 0.2, + "output": 0.7 + }, + "type": "chat" }, { - "id": "BAAI/bge-large-zh-v1.5", - "name": "BAAI/bge-large-zh-v1.5", - "display_name": "BAAI/bge-large-zh-v1.5", + "id": "qwen3-vl-flash", + "name": "Qwen3 VL Flash", + "display_name": "Qwen3 VL Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 32000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "type": "embedding" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-09", + "last_updated": "2025-10-09", + "cost": { + "input": 0.022, + "output": 0.215, + "cache_read": 0.0044 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-32B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-32B-Instruct", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + 
"display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-14B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-14B-Instruct", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -75568,42 +80827,77 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "Pro/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "gpt-4.1-mini", 
+ "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-Coder-7B-Instruct", + "id": "llama-3.1-nemotron-ultra-253b", + "name": "Llama 3.1 Nemotron Ultra 253B", + "display_name": "Llama 3.1 Nemotron Ultra 253B", "modalities": { "input": [ "text" @@ -75613,40 +80907,61 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-04-07", + "last_updated": "2025-04-07", + "cost": { + "input": 0.6, + "output": 1.8 + }, + "type": "chat" }, { - "id": "Pro/BAAI/bge-m3", - "name": "Pro/BAAI/bge-m3", - "display_name": "Pro/BAAI/bge-m3", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "type": "embedding" + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" }, { - "id": "Pro/Qwen/Qwen2.5-7B-Instruct", - 
"name": "Pro/Qwen/Qwen2.5-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2.5-7B-Instruct", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -75656,63 +80971,116 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1000000, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.3, + "output": 1.5 + }, "type": "chat" }, { - "id": "Pro/BAAI/bge-reranker-v2-m3", - "name": "Pro/BAAI/bge-reranker-v2-m3", - "display_name": "Pro/BAAI/bge-reranker-v2-m3", + "id": "gemma-2-27b-it-together", + "name": "Gemma 2 27B IT", + "display_name": "Gemma 2 27B IT", "modalities": { "input": [ "text" ], "output": [ - "score" + "text" ] }, "limit": { "context": 8192, - "output": 2048 + "output": 16384 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "type": "rerank" + "attachment": false, + "open_weights": true, + "release_date": "2024-06-27", + "last_updated": "2024-06-27", + "cost": { + "input": 0.08, + "output": 0.08 + }, + "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-72B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-72B-Instruct", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], 
+ "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "Pro/Qwen/Qwen2-7B-Instruct", - "name": "Pro/Qwen/Qwen2-7B-Instruct", - "display_name": "Pro/Qwen/Qwen2-7B-Instruct", + "id": "llama-3.2-11b-instruct", + "name": "Llama 3.2 11B Instruct", + "display_name": "Llama 3.2 11B Instruct", "modalities": { "input": [ "text" @@ -75722,63 +81090,115 @@ ] }, "limit": { - "context": 131072, + "context": 128000, "output": 8192 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.07, + "output": 0.33 + }, "type": "chat" }, { - "id": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "name": "LoRA/Qwen/Qwen2.5-7B-Instruct", - "display_name": "LoRA/Qwen/Qwen2.5-7B-Instruct", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1050000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 
30, + "output": 180 }, "type": "chat" }, { - "id": "Pro/THUDM/glm-4-9b-chat", - "name": "Pro/THUDM/glm-4-9b-chat", - "display_name": "Pro/THUDM/glm-4-9b-chat", + "id": "glm-4.6v-flash", + "name": "GLM-4.6V Flash", + "display_name": "GLM-4.6V Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", + "cost": { + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-Rumination-32B-0414", - "name": "THUDM/GLM-Z1-Rumination-32B-0414", - "display_name": "THUDM/GLM-Z1-Rumination-32B-0414", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ "text" @@ -75789,225 +81209,469 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 98304 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 + }, "type": "chat" }, { - "id": "stabilityai/stable-diffusion-xl-base-1.0", - "name": "stabilityai/stable-diffusion-xl-base-1.0", - "display_name": "stabilityai/stable-diffusion-xl-base-1.0", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": false + }, 
+ "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-schnell", - "name": "black-forest-labs/FLUX.1-schnell", - "display_name": "black-forest-labs/FLUX.1-schnell", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 1048576, + "output": 65536 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 + }, + "type": 
"chat" }, { - "id": "black-forest-labs/FLUX.1-dev", - "name": "black-forest-labs/FLUX.1-dev", - "display_name": "black-forest-labs/FLUX.1-dev", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 200000, + "output": 131072 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "Pro/black-forest-labs/FLUX.1-schnell", - "name": "Pro/black-forest-labs/FLUX.1-schnell", - "display_name": "Pro/black-forest-labs/FLUX.1-schnell", + "id": "qwen3-vl-235b-a22b-instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false - } + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 0.3, + "output": 1.5 + }, + "type": "chat" }, { - "id": "stabilityai/stable-diffusion-3-5-large", - "name": "stabilityai/stable-diffusion-3-5-large", - "display_name": "stabilityai/stable-diffusion-3-5-large", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 1048576, + "output": 131072 + }, + "temperature": true, + "tool_call": true, 
"reasoning": { - "supported": false - } - }, - { - "id": "fishaudio/fish-speech-1.4", - "name": "fishaudio/fish-speech-1.4", - "display_name": "fishaudio/fish-speech-1.4", - "modalities": { - "input": [ - "text" + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } ], - "output": [ - "audio" - ] + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, - "tool_call": false, - "reasoning": { - "supported": false - } + "type": "chat" }, { - "id": "RVC-Boss/GPT-SoVITS", - "name": "RVC-Boss/GPT-SoVITS", - "display_name": "RVC-Boss/GPT-SoVITS", + "id": "gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false - } + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-01", + "last_updated": "2024-10-01", + "cost": { + "input": 2.5, + "output": 10 + }, + "type": "chat" }, { - "id": "fishaudio/fish-speech-1.5", - "name": "fishaudio/fish-speech-1.5", - "display_name": "fishaudio/fish-speech-1.5", + "id": "llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, + "limit": { + "context": 32768, + "output": 32000 + }, + "temperature": true, 
"tool_call": false, "reasoning": { "supported": false - } + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", + "cost": { + "input": 0.03, + "output": 0.05 + }, + "type": "chat" }, { - "id": "black-forest-labs/FLUX.1-pro", - "name": "black-forest-labs/FLUX.1-pro", - "display_name": "black-forest-labs/FLUX.1-pro", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, - "tool_call": false, + "limit": { + "context": 1048576, + "output": 131072 + }, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false - } - }, - { - "id": "LoRA/black-forest-labs/FLUX.1-dev", - "name": "LoRA/black-forest-labs/FLUX.1-dev", - "display_name": "LoRA/black-forest-labs/FLUX.1-dev", - "modalities": { - "input": [ - "text" + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } ], - "output": [ - "image" - ] + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, - "tool_call": false, - "reasoning": { - "supported": false - } + "type": "chat" }, { - "id": "SeedLLM/Seed-Rice-7B", - "name": "SeedLLM/Seed-Rice-7B", - "display_name": "SeedLLM/Seed-Rice-7B", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 
1050000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", + "cost": { + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" - } - ] - }, - "zhipuai-coding-plan": { - "id": "zhipuai-coding-plan", - "name": "Zhipu AI Coding Plan", - "display_name": "Zhipu AI Coding Plan", - "api": "https://open.bigmodel.cn/api/coding/paas/v4", - "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", - "models": [ + }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", "image", - "video", "pdf" ], "output": [ @@ -76015,42 +81679,30 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": 
"gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -76060,8 +81712,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 131072, + "output": 32766 }, "temperature": true, "tool_call": true, @@ -76071,31 +81723,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "glm-4.5-flash", + "name": "GLM-4.5-Flash", + "display_name": "GLM-4.5-Flash", "modalities": { "input": [ "text" @@ -76115,7 +81759,7 @@ "default": true }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", "release_date": "2025-07-28", "last_updated": "2025-07-28", @@ -76128,9 +81772,9 @@ "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -76140,7 +81784,7 @@ ] }, "limit": { - "context": 200000, + "context": 204800, "output": 131072 }, "temperature": true, @@ -76161,123 +81805,97 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 1, + "output": 3.2, + "cache_read": 0.2, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", 
+ "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.345, + "output": 1.377 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "mistral-large-2512", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" - } - ] - }, - "xai": { - "id": "xai", - "name": "xai", - "display_name": "xai", - "doc": "https://docs.x.ai/docs/models", - "models": [ + }, { - "id": "grok-build-0.1", - "name": "Grok Build 0.1", - "display_name": "Grok Build 0.1", + "id": "qwen-turbo", + 
"name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -76287,91 +81905,63 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 4, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 4, - "cache_read": 0.4 - } + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" }, { - "id": "grok-4.20-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "custom", + "name": "Custom Model", + "display_name": "Custom Model", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - 
"cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-0309", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "grok-4-20-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text", @@ -76387,7 +81977,7 @@ "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -76425,22 +82015,21 @@ "type": "chat" }, { - "id": "grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 163840, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -76454,205 +82043,142 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "open_weights": true, + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } - }, - "type": "chat" - }, - { - "id": "grok-imagine-image", - "name": "Grok Imagine Image", - "display_name": "Grok Imagine Image", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "image", - "pdf" - ] - }, - "limit": { - "context": 8000, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "input": 0.28, + "output": 0.42, + "cache_read": 0.056 }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", "type": "chat" }, { - 
"id": "grok-4.20-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "grok-imagine-image-quality", - "name": "Grok Imagine Image Quality", - "display_name": "Grok Imagine Image Quality", + "id": "auto", + "name": "Auto Route", + "display_name": "Auto Route", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "image", - "pdf" + "text" ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "release_date": "2024-01-01", + 
"last_updated": "2024-01-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "grok-imagine-video", - "name": "Grok Imagine Video", - "display_name": "Grok Imagine Video", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", "image", "video", + "audio", "pdf" ], - "output": [ - "video" - ] - }, - "limit": { - "context": 1024, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", - "type": "chat" - }, - { - "id": "grok-3-mini-fast-beta", - "name": "Grok 3 Mini Fast Beta", - "display_name": "Grok 3 Mini Fast Beta", - "modalities": { - "input": [ - "text" - ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true, - "effort": "low" + "default": true }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, - "attachment": false, "type": "chat" }, { - "id": "grok-3-mini-beta", - "name": "Grok 3 Mini Beta", - "display_name": "Grok 3 Mini Beta", + "id": "codestral-2508", + "name": "Codestral", + "display_name": "Codestral", "modalities": { "input": [ "text" @@ -76662,26 +82188,28 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 256000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "effort": "low" - }, - "search": { 
"supported": false }, "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", + "cost": { + "input": 0.3, + "output": 0.9 + }, "type": "chat" }, { - "id": "grok-3-fast-beta", - "name": "Grok 3 Fast Beta", - "display_name": "Grok 3 Fast Beta", + "id": "qwen3-235b-a22b-fp8", + "name": "Qwen3 235B A22B FP8", + "display_name": "Qwen3 235B A22B FP8", "modalities": { "input": [ "text" @@ -76691,52 +82219,86 @@ ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "search": { - "supported": false + "supported": true, + "default": true }, "attachment": false, + "open_weights": true, + "release_date": "2025-04-28", + "last_updated": "2025-04-28", + "cost": { + "input": 0.2, + "output": 0.8 + }, "type": "chat" }, { - "id": "grok-2-vision-1212", - "name": "Grok 2 Vision 1212", - "display_name": "Grok 2 Vision 1212", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, 
- "attachment": false, "type": "chat" }, { - "id": "grok-2-image-1212", - "name": "Grok 2 Image 1212", - "display_name": "Grok 2 Image 1212", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ "text", @@ -76747,119 +82309,131 @@ ] }, "limit": { - "context": 130000, - "output": 100000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false - }, "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", + "cost": { + "input": 0.21, + "output": 0.63 + }, "type": "chat" }, { - "id": "grok-3-beta", - "name": "Grok 3 Beta", - "display_name": "Grok 3 Beta", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 100000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "search": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "type": "chat" - }, - { - "id": "grok-2-1212", - "name": "Grok 2 1212", - "display_name": "Grok 2 1212", - "modalities": { - "input": [ - "text" + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - 
"context": 120000, - "output": 100000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "search": { - "supported": false + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, - "attachment": false, "type": "chat" - } - ] - }, - "v0": { - "id": "v0", - "name": "v0", - "display_name": "v0", - "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", - "models": [ + }, { - "id": "v0-1.5-lg", - "name": "v0-1.5-lg", - "display_name": "v0-1.5-lg", + "id": "gemini-2.0-flash-lite", + "name": "Gemini 2.0 Flash-Lite", + "display_name": "Gemini 2.0 Flash-Lite", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 32000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2024-06", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 15, - "output": 75 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "v0-1.0-md", - "name": "v0-1.0-md", - "display_name": "v0-1.0-md", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -76870,71 +82444,134 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" 
+ ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 3, - "output": 15 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "v0-1.5-md", - "name": "v0-1.5-md", - "display_name": "v0-1.5-md", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-06-09", - "last_updated": "2025-06-09", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 3, - "output": 15 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" } ] }, - "neuralwatt": { - "id": "neuralwatt", - "name": "Neuralwatt", - "display_name": "Neuralwatt", - "api": "https://api.neuralwatt.com/v1", - "doc": "https://portal.neuralwatt.com/docs", + "alibaba-coding-plan-cn": { + "id": "alibaba-coding-plan-cn", + "name": "Alibaba Coding Plan (China)", + "display_name": "Alibaba Coding Plan (China)", + "api": 
"https://coding.dashscope.aliyuncs.com/v1", + "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", "models": [ { - "id": "glm-5-fast", - "name": "GLM 5 Fast", - "display_name": "GLM 5 Fast", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -76944,8 +82581,8 @@ ] }, "limit": { - "context": 202736, - "output": 202736 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -76954,18 +82591,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 1.1, - "output": 3.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3.5-397b-fast", - "name": "Qwen3.5 397B Fast", - "display_name": "Qwen3.5 397B Fast", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -76975,13 +82615,14 @@ ] }, "limit": { - "context": 262128, - "output": 262128 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -76996,50 +82637,21 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", - "cost": { - "input": 0.69, - "output": 4.14 - }, - "type": "chat" - }, - { - "id": "kimi-k2.5-fast", - "name": "Kimi K2.5 Fast", - "display_name": "Kimi K2.5 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262128, - "output": 262128 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": 
"2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.52, - "output": 2.59 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3.6-35b-fast", - "name": "Qwen3.6 35B Fast", - "display_name": "Qwen3.6 35B Fast", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ "text", @@ -77050,134 +82662,37 @@ ] }, "limit": { - "context": 131056, - "output": 131056 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", - "cost": { - "input": 0.29, - "output": 1.15 - }, - "type": "chat" - }, - { - "id": "kimi-k2.6-fast", - "name": "Kimi K2.6 Fast", - "display_name": "Kimi K2.6 Fast", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262128, - "output": 262128 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.69, - "output": 3.22 - }, - "type": "chat" - }, - { - "id": "glm-5.1-fast", - "name": "GLM 5.1 Fast", - "display_name": "GLM 5.1 Fast", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 202736, - "output": 202736 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", - "cost": { - 
"input": 1.1, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "mistralai/Devstral-Small-2-24B-Instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262128, - "output": 262128 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.12, - "output": 0.35 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -77187,8 +82702,8 @@ ] }, "limit": { - "context": 196592, - "output": 196592 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -77198,40 +82713,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.35, - "output": 1.38 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM 5.1 FP8", - "display_name": "GLM 5.1 FP8", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" 
], "output": [ "text" ] }, "limit": { - "context": 202736, - "output": 202736 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -77250,38 +82763,37 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 1.1, - "output": 3.6 + "input": 0.1875, + "output": 1.125, + "cache_write": 0.234375 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262128, - "output": 262128 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -77294,20 +82806,23 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0.69, - "output": 3.22 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", @@ -77318,8 +82833,8 @@ ] }, "limit": { - "context": 262128, - "output": 262128 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -77338,20 +82853,23 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + 
"open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.52, - "output": 2.59 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -77362,8 +82880,8 @@ ] }, "limit": { - "context": 131056, - "output": 131056 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -77384,18 +82902,21 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.29, - "output": 1.15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-FP8", - "name": "Qwen3.5 397B A17B FP8", - "display_name": "Qwen3.5 397B A17B FP8", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -77405,8 +82926,8 @@ ] }, "limit": { - "context": 262128, - "output": 262128 + "context": 196608, + "output": 24576 }, "temperature": true, "tool_call": true, @@ -77427,18 +82948,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.69, - "output": 4.14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -77448,43 +82971,30 @@ ] }, "limit": { - "context": 16368, - "output": 
16368 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.03, - "output": 0.16 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "friendli": { - "id": "friendli", - "name": "Friendli", - "display_name": "Friendli", - "api": "https://api.friendli.ai/serverless/v1", - "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", - "models": [ + }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -77494,8 +83004,8 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -77515,31 +83025,34 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -77559,33 +83072,45 @@ } }, "attachment": false, - "open_weights": true, - 
"release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "abacus": { + "id": "abacus", + "name": "Abacus", + "display_name": "Abacus", + "api": "https://routellm.abacus.ai/v1", + "doc": "https://abacus.ai/help/api", + "models": [ { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -77594,170 +83119,195 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "route-llm", + "name": "Route LLM", + "display_name": "Route LLM", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8000 + "context": 128000, + 
"output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-01", - "last_updated": "2025-12-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.6, - "output": 0.6 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-5.3-codex-xhigh", + "name": "GPT-5.3 Codex XHigh", + "display_name": "GPT-5.3 Codex XHigh", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": 
"2026-01-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.2, - "output": 0.8 + "input": 1.75, + "output": 14 }, "type": "chat" - } - ] - }, - "github-copilot": { - "id": "github-copilot", - "name": "GitHub Copilot", - "display_name": "GitHub Copilot", - "api": "https://api.githubcopilot.com", - "doc": "https://docs.github.com/en/copilot", - "models": [ + }, { - "id": "raptor-mini", - "name": "Raptor mini", - "display_name": "Raptor mini", + "id": "llama-3.3-70b-versatile", + "name": "Llama 3.3 70B Versatile", + "display_name": "Llama 3.3 70B Versatile", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.59, + "output": 0.79 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -77765,53 
+83315,49 @@ ] }, "limit": { - "context": 216000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -77822,8 +83368,8 @@ ] }, "limit": { - "context": 264000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -77854,34 +83400,34 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", + "knowledge": "2024-09-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", 
"modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -77891,44 +83437,44 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -77936,95 +83482,76 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", + "default_enabled": true, + "mode": 
"budget", "budget": { - "min": 1024, + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -78034,51 +83561,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 2.5, - 
"output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -78089,52 +83595,40 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -78149,13 +83643,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", 
"medium", "high" @@ -78165,36 +83652,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 20, + "output": 40 }, "type": "chat" }, { - "id": "claude-opus-4.5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -78219,17 +83689,11 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", + "mode": "budget", "budget": { "min": 1024, "unit": "tokens" }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -78237,97 +83701,61 @@ "thinking_blocks" ], "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 2000000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2025-11-17", + "last_updated": "2025-11-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -78335,101 +83763,112 @@ ] }, "limit": { - "context": 128000, + "context": 200000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", + "default_enabled": false, + "mode": "mixed", "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", @@ -78459,8 +83898,7 @@ "none", "low", "medium", - "high", - "xhigh" + 
"high" ], "verbosity": "medium", "verbosity_options": [ @@ -78473,35 +83911,86 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-14", + "last_updated": "2025-05-14", + "cost": { + "input": 15, + "output": 75 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-chat-latest", + "name": "GPT-5.3 Chat Latest", + "display_name": "GPT-5.3 Chat Latest", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -78509,68 +83998,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -78585,13 +84037,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" 
@@ -78599,95 +84044,66 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo Preview", + "display_name": "Kimi K2 Turbo Preview", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "release_date": "2025-07-08", + "last_updated": "2025-07-08", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0.15, + "output": 8 }, "type": "chat" }, { - "id": "claude-sonnet-4.5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - 
"temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -78697,40 +84113,39 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -78775,84 +84190,51 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { "input": 1.75, - "output": 14, - "cache_read": 0.175 + "output": 14 }, "type": "chat" }, { - "id": "claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "grok-4-0709", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - 
"output": 32000 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "claude-haiku-4.5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", @@ -78896,83 +84278,64 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "claude-opus-4.8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": 
{ - "context": 200000, - "output": 64000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "gpt-5.1-chat-latest", + "name": "GPT-5.1 Chat Latest", + "display_name": "GPT-5.1 Chat Latest", "modalities": { "input": [ "text", @@ -78990,131 +84353,103 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - 
"knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 1.25, + "output": 10 }, "type": "chat" - } - ] - }, - "inference": { - "id": "inference", - "name": "Inference", - "display_name": "Inference", - "api": "https://inference.net/v1", - "doc": "https://inference.net/models", - "models": [ + }, { - "id": "osmosis/osmosis-structure-0.6b", - "name": "Osmosis Structure 0.6B", - "display_name": "Osmosis Structure 0.6B", + "id": "gpt-5.2-chat-latest", + "name": "GPT-5.2 Chat Latest", + "display_name": "GPT-5.2 Chat Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 2048 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.1, - "output": 0.5 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "mistral/mistral-nemo-12b-instruct", - "name": "Mistral Nemo 12B Instruct", - "display_name": "Mistral Nemo 12B Instruct", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 Nano", + "display_name": "GPT-4.1 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", 
+ "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.038, - "output": 0.1 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "qwen/qwen-2.5-7b-vision-instruct", - "name": "Qwen 2.5 7B Vision Instruct", - "display_name": "Qwen 2.5 7B Vision Instruct", + "id": "gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -79122,84 +84457,75 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "qwen/qwen3-embedding-4b", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 2048 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.01, - "output": 0 - }, - "type": "embedding" - }, - { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 
+ "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.02, - "output": 0.02 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", @@ -79210,135 +84536,202 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 
0.055, - "output": 0.055 + "input": 2.5, + "output": 15 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.01, - "output": 0.01 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - 
"input": 0.025, - "output": 0.025 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "google/gemma-3", - "name": "Google Gemma 3", - "display_name": "Google Gemma 3", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 125000, - "output": 4096 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.15, - "output": 0.3 + "input": 5, + "output": 25 }, "type": "chat" - } - ] - }, - "huggingface": { - "id": "huggingface", - "name": "Hugging Face", - "display_name": "Hugging Face", - "api": "https://router.huggingface.co/v1", - "doc": "https://huggingface.co/docs/inference-providers", - "models": [ + }, { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "qwen-2.5-coder-32b", + "name": "Qwen 2.5 Coder 32B", + "display_name": "Qwen 2.5 Coder 32B", "modalities": { "input": [ "text" @@ -79348,87 +84741,98 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.79, + "output": 0.79 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, 
+ "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -79437,43 +84841,87 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": 
"MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 Mini", + "display_name": "GPT-4.1 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.4, + "output": 1.6 + }, + "type": "chat" + }, + { + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -79481,85 +84929,149 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - 
"text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast (Non-Reasoning)", + "display_name": "Grok 4 Fast (Non-Reasoning)", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 2000000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-09", + "last_updated": "2025-07-09", + "cost": { + "input": 0.2, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", + "modalities": { + 
"input": [ + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -79570,86 +85082,84 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "gpt-4o-mini", + "name": "GPT-4o Mini", + "display_name": "GPT-4o Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-04-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": 
"GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -79658,42 +85168,54 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -79703,142 +85225,169 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-20", - 
"last_updated": "2026-04-20", + "open_weights": false, + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "cache_write": 1 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi-K2-Instruct-0905", - "display_name": "Kimi-K2-Instruct-0905", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-04", - "last_updated": "2025-09-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1, - "output": 3 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, 
"extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "Kimi-K2-Instruct", - "display_name": "Kimi-K2-Instruct", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": "2025-07-14", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 1, - "output": 3 + "input": 0.14, + "output": 0.59 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi-K2-Thinking", - "display_name": "Kimi-K2-Thinking", + "id": "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", + "name": "Llama 3.1 405B Instruct Turbo", + "display_name": "Llama 3.1 405B Instruct Turbo", "modalities": { "input": [ "text" @@ -79848,42 +85397,28 @@ ] }, "limit": { 
- "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 3.5, + "output": 3.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ "text" @@ -79893,42 +85428,28 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "Qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" 
@@ -79938,7 +85459,7 @@ ] }, "limit": { - "context": 163840, + "context": 262144, "output": 65536 }, "temperature": true, @@ -79947,26 +85468,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.28, - "output": 0.4 + "input": 0.29, + "output": 1.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "Qwen/QwQ-32B", + "name": "QwQ 32B", + "display_name": "QwQ 32B", "modalities": { "input": [ "text" @@ -79976,8 +85491,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -79998,19 +85513,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2024-11-28", + "last_updated": "2024-11-28", "cost": { - "input": 3, - "output": 5 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ "text" @@ -80021,28 +85535,28 @@ }, "limit": { "context": 262144, - "output": 66536 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 2, - 
"output": 2 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen 3 Embedding 8B", - "display_name": "Qwen 3 Embedding 8B", + "id": "Qwen/Qwen3-32B", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -80052,29 +85566,40 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.01, - "output": 0 + "input": 0.09, + "output": 0.29 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next", - "name": "Qwen3-Coder-Next", - "display_name": "Qwen3-Coder-Next", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen 2.5 72B Instruct", + "display_name": "Qwen 2.5 72B Instruct", "modalities": { "input": [ "text" @@ -80084,8 +85609,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -80094,30 +85619,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.11, + "output": 0.38 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "openai/gpt-oss-120b", + 
"name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -80127,48 +85652,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 3 + "input": 0.08, + "output": 0.44 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "zai-org/glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -80181,21 +85697,20 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-01", - "last_updated": "2026-02-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { "input": 0.6, - "output": 3.6 + "output": 2.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "zai-org/glm-4.5", + "name": "GLM-4.5", + "display_name": "GLM-4.5", "modalities": { "input": [ "text" @@ -80205,29 +85720,29 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + 
"context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.25, - "output": 1 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-4B", - "name": "Qwen 3 Embedding 4B", - "display_name": "Qwen 3 Embedding 4B", + "id": "zai-org/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" @@ -80237,29 +85752,33 @@ ] }, "limit": { - "context": 32000, - "output": 2048 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.01, - "output": 0 + "input": 0.6, + "output": 2.2 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "zai-org/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -80269,13 +85788,14 @@ ] }, "limit": { - "context": 262144, + "context": 204800, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -80290,27 +85810,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + 
"release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3, - "output": 2 + "input": 1, + "output": 3.2 }, "type": "chat" - } - ] - }, - "cohere": { - "id": "cohere", - "name": "Cohere", - "display_name": "Cohere", - "doc": "https://docs.cohere.com/docs/models", - "models": [ + }, { - "id": "command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -80321,56 +85832,39 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" - }, - { - "id": "c4ai-aya-vision-8b", - "name": "Aya Vision 8B", - "display_name": "Aya Vision 8B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16000, - "output": 4000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "input": 3, + "output": 7 }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", "type": "chat" }, { - "id": "command-a-reasoning-08-2025", - "name": "Command A Reasoning", - "display_name": "Command A Reasoning", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -80380,8 +85874,8 @@ ] }, "limit": { - 
"context": 256000, - "output": 32000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -80391,47 +85885,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 2.5, - "output": 10 - }, - "type": "chat" - }, - { - "id": "c4ai-aya-vision-32b", - "name": "Aya Vision 32B", - "display_name": "Aya Vision 32B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16000, - "output": 4000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "input": 0.27, + "output": 1 }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-04", - "last_updated": "2025-05-14", "type": "chat" }, { - "id": "c4ai-aya-expanse-8b", - "name": "Aya Expanse 8B", - "display_name": "Aya Expanse 8B", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -80441,28 +85906,37 @@ ] }, "limit": { - "context": 8000, - "output": 4000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", + "cost": { + "input": 0.27, + "output": 0.4 + }, "type": "chat" }, { - "id": "command-a-plus-05-2026", - "name": "Command A Plus", - "display_name": "Command A Plus", + "id": "deepseek/deepseek-v3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -80470,7 +85944,7 
@@ }, "limit": { "context": 128000, - "output": 64000 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -80478,21 +85952,29 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04-01", - "release_date": "2026-05-20", - "last_updated": "2026-06-09", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 2.5, - "output": 10 + "input": 0.55, + "output": 1.66 }, "type": "chat" - }, + } + ] + }, + "cloudferro-sherlock": { + "id": "cloudferro-sherlock", + "name": "CloudFerro Sherlock", + "display_name": "CloudFerro Sherlock", + "api": "https://api-sherlock.cloudferro.com/openai/v1/", + "doc": "https://docs.sherlock.cloudferro.com/", + "models": [ { - "id": "north-mini-code-1-0", - "name": "North Mini Code", - "display_name": "North Mini Code", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -80502,41 +85984,29 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 70000, + "output": 70000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-09-23", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "knowledge": "2024-10-09", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0 + "input": 2.92, + "output": 2.92 }, "type": "chat" }, { - "id": "command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT OSS 120B", + "display_name": "OpenAI GPT OSS 120B", "modalities": { "input": [ "text" 
@@ -80546,29 +86016,34 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.92, + "output": 2.92 }, "type": "chat" }, { - "id": "command-r7b-12-2024", - "name": "Command R7B", - "display_name": "Command R7B", + "id": "speakleash/Bielik-11B-v3.0-Instruct", + "name": "Bielik 11B v3.0 Instruct", + "display_name": "Bielik 11B v3.0 Instruct", "modalities": { "input": [ "text" @@ -80578,8 +86053,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -80588,19 +86063,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "knowledge": "2025-03", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0.67, + "output": 0.67 }, "type": "chat" }, { - "id": "command-a-03-2025", - "name": "Command A", - "display_name": "Command A", + "id": "speakleash/Bielik-11B-v2.6-Instruct", + "name": "Bielik 11B v2.6 Instruct", + "display_name": "Bielik 11B v2.6 Instruct", "modalities": { "input": [ "text" @@ -80610,8 +86085,8 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 32000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -80620,19 +86095,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", + "knowledge": "2025-03", "release_date": "2025-03-13", "last_updated": "2025-03-13", "cost": { - "input": 
2.5, - "output": 10 + "input": 0.67, + "output": 0.67 }, "type": "chat" }, { - "id": "c4ai-aya-expanse-32b", - "name": "Aya Expanse 32B", - "display_name": "Aya Expanse 32B", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -80642,24 +86117,43 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 196000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-10-24", - "last_updated": "2024-10-24", + "knowledge": "2026-01", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" - }, + } + ] + }, + "cloudflare-ai-gateway": { + "id": "cloudflare-ai-gateway", + "name": "Cloudflare AI Gateway", + "display_name": "Cloudflare AI Gateway", + "doc": "https://developers.cloudflare.com/ai-gateway/", + "models": [ { - "id": "command-a-vision-07-2025", - "name": "Command A Vision", - "display_name": "Command A Vision", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -80670,29 +86164,45 @@ ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + 
"attachment": true, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 2.5, - "output": 10 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "command-a-translate-08-2025", - "name": "Command A Translate", - "display_name": "Command A Translate", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-turbo", + "display_name": "GPT-3.5-turbo", "modalities": { "input": [ "text" @@ -80702,32 +86212,34 @@ ] }, "limit": { - "context": 8000, - "output": 8000 + "context": 16385, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "open_weights": false, + "knowledge": "2021-09-01", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.5, + "output": 1.5, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "command-r7b-arabic-02-2025", - "name": "Command R7B Arabic", - "display_name": "Command R7B Arabic", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -80735,105 +86247,65 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.0375, - "output": 0.15 - }, - "type": "chat" - } - ] - }, - "azure-cognitive-services": { - "id": "azure-cognitive-services", - "name": "Azure Cognitive Services", - "display_name": 
"Azure Cognitive Services", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, + "type": "chat" + }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "openai/gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -80841,52 +86313,44 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 1.1, + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -80897,8 +86361,8 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -80911,14 +86375,8 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -80928,45 +86386,30 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-05", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 20, + "output": 80 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "openai/gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -80985,8 +86428,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": 
"medium", "verbosity_options": [ @@ -80999,50 +86441,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -81051,39 +86476,47 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.95, - "output": 4 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - 
"output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -81093,40 +86526,40 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -81145,16 +86578,15 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", "high", @@ -81172,24 +86604,23 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": 
"2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -81197,52 +86628,44 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", @@ -81254,7 +86677,7 @@ ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -81288,102 +86711,52 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with 
effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", @@ -81395,70 +86768,7 @@ }, "limit": { "context": 128000, - "output": 1536 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", - "cost": { - "input": 0.12, - "output": 0 - }, - "type": "chat" - }, - { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 512, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", - "cost": { - "input": 0.1, - "output": 0 - }, - "type": "chat" - }, - { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", - 
"modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -81467,161 +86777,33 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 - }, - "type": "chat" - }, - { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 256000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", - "cost": { - "input": 60, - "output": 120 - }, - "type": "chat" - }, - { - "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 8000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", - "cost": { - "input": 2.5, - "output": 10 - }, - "type": 
"chat" - }, - { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -81629,22 +86811,43 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", 
"modalities": { "input": [ "text", @@ -81655,53 +86858,65 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.6, - "output": 3 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -81716,6 +86931,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -81723,65 +86945,50 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - 
"input": 15, - "output": 60, - "cache_read": 7.5 - }, - "type": "chat" - }, - { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", - "modalities": { - "input": [ - "text" + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4096, - "output": 4096 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", - "cost": { - "input": 1.5, - "output": 2 + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "anthropic/claude-3.5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 8192 }, "temperature": true, @@ -81790,64 +86997,35 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 2.04, - "output": 2.04 - }, - "type": "chat" - }, - { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - 
"last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "anthropic/claude-3.5-sonnet", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -81856,139 +87034,94 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", - "cost": { - "input": 10, - "output": 30 - }, - "type": "chat" - }, - { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { "input": 3, - "output": 4 + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ "text", "image", - "audio" - ], - "output": [ - "text", - "image", - "audio" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - 
"temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", - "modalities": { - "input": [ - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.075, - "output": 0.3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -81998,317 +87131,313 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", "high" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "knowledge": "2026-01", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "anthropic/claude-3-sonnet", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, + "context": 200000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", - "cost": { - "input": 1.5, - "output": 2 - }, - "type": "chat" - }, - { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 2048 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 2.68, - "output": 3.54 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "anthropic/claude-opus-4-8", + "name": "Claude Opus 4.8", + 
"display_name": "Claude Opus 4.8", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", - "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 - }, - "type": "chat" - }, - { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.15, - "output": 0.6 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": 
"anthropic/claude-3-opus", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0.16, - "output": 0.64 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "anthropic/claude-3-5-haiku", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 8192 }, "temperature": true, @@ -82317,98 +87446,92 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", - "cost": { - "input": 0.37, - "output": 0.37 - }, - "type": "chat" - }, - { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 16384, - "output": 16384 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + 
"last_updated": "2024-10-22", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "anthropic/claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "anthropic/claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -82422,426 +87545,531 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.58, - "output": 1.68 - }, - "type": "chat" - }, - { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4096, - "output": 1024 + "default": false }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for 
this model family." + ] + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.17, - "output": 0.68 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6 (latest)", + "display_name": "Claude Opus 4.6 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 2.68, - "output": 3.54 - }, - "type": "chat" - }, - { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - "display_name": "Phi-3-mini-instruct (4k)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 4096, - "output": 1024 + "supported": true, + "default": false }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; 
budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.13, - "output": 0.52 - }, - "type": "chat" - }, - { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", - "modalities": { - "input": [ - "text" + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 512, - "output": 1024 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", - "cost": { - "input": 0.1, - "output": 0 + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "anthropic/claude-3-haiku", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "attachment": true, + "open_weights": false, + 
"knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1000000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.3, - "output": 0.61 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "anthropic/claude-opus-4", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" - }, + } + ] + }, + "moonshot": { + "id": "moonshot", + "name": "Moonshot AI (China)", + "display_name": "Moonshot AI (China)", + "api": "https://api.moonshot.cn/v1", + "doc": "https://platform.moonshot.cn/docs/api/chat", + "models": [ { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 2.5, - "output": 10 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "kimi-k2-turbo-preview", + "name": "Kimi K2 Turbo", + "display_name": "Kimi K2 Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.25, - "output": 1 + "input": 2.4, + "output": 10, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "kimi-k2-0711-preview", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": 
"2025-05-07", - "last_updated": "2025-05-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-14", + "last_updated": "2025-07-14", "cost": { - "input": 0.4, - "output": 2 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -82851,11 +88079,11 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -82873,19 +88101,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "kimi-k2-thinking-turbo", + "name": "Kimi K2 Thinking Turbo", + "display_name": "Kimi K2 Thinking Turbo", "modalities": { "input": [ "text" @@ -82895,30 +88124,42 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2024-08", + "release_date": "2025-11-06", + 
"last_updated": "2025-11-06", "cost": { - "input": 0.125, - "output": 0.5 + "input": 1.15, + "output": 8, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "kimi-k2-0905-preview", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -82928,157 +88169,140 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 262144, + "output": 262144 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.1, - "output": 0 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, - "type": "embedding" - }, + "type": "chat" + } + ] + }, + "morph": { + "id": "morph", + "name": "Morph", + "display_name": "Morph", + "api": "https://api.morphllm.com/v1", + "doc": "https://docs.morphllm.com/api-reference/introduction", + "models": [ { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "morph-v3-fast", + "name": "Morph v3 Fast", + "display_name": "Morph v3 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 16000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + 
"supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "morph-v3-large", + "name": "Morph v3 Large", + "display_name": "Morph v3 Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "auto", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.15, - 
"output": 0.6, - "cache_read": 0.075 + "input": 0.85, + "output": 1.55 }, "type": "chat" - }, + } + ] + }, + "deepinfra": { + "id": "deepinfra", + "name": "Deep Infra", + "display_name": "Deep Infra", + "doc": "https://deepinfra.com/models", + "models": [ { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B FP8", + "display_name": "Llama 4 Maverick 17B FP8", "modalities": { "input": [ "text", @@ -83089,143 +88313,58 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1048576, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B", + "display_name": "Llama 4 Scout 17B", "modalities": { "input": [ "text", - "image", - "audio" - ], - "output": [ - "text", - "image", - "audio" - ] - }, - "limit": { - "context": 272000, - "output": 128000 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - 
"supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 327680, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.075, + "input": 0.1, "output": 0.3 }, "type": "chat" }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B Turbo", + "display_name": "Llama 3.3 70B Turbo", "modalities": { "input": [ "text" @@ -83235,205 +88374,247 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 16384 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.1, + "output": 0.32 }, "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", 
- "display_name": "Phi-3-mini-instruct (128k)", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2024-04", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.75, + "output": 3.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.2, - "output": 0.78 + 
"input": 0.45, + "output": 2.25, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { - "id": "gpt-4-32k", - "name": "GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "google/gemma-4-26B-A4B-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 60, - "output": 120 + "input": 0.07, + "output": 0.34 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "Qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 
128000, - "output": 128000 + "context": 262144, + "output": 81920 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { "input": 0.15, - "output": 0.15 + "output": 0.95 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen 3.5 397B A17B", + "display_name": "Qwen 3.5 397B A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 81920 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -83442,56 +88623,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", 
- "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.45, + "output": 3, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", + "name": "Qwen3 Coder 480B A35B Instruct Turbo", + "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", "modalities": { "input": [ "text" @@ -83501,62 +88656,76 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 66536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.3, + "output": 1 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "Qwen/Qwen3.5-35B-A3B", + "name": "Qwen 3.5 35B A3B", + "display_name": "Qwen 3.5 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 262144, + "output": 81920 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "knowledge": "2025-01", + "release_date": "2026-02-01", + "last_updated": "2026-04-20", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.14, + "output": 1, + 
"cache_read": 0.05 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -83566,10 +88735,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -83577,48 +88746,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.039, + "output": 0.19 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -83626,64 +88783,87 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + 
"last_updated": "2025-08-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "XiaomiMiMo/MiMo-V2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 262144, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.13, - "output": 0 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, - "type": "embedding" + "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "XiaomiMiMo/MiMo-V2.5-Pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -83693,8 +88873,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -83704,72 +88884,104 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + 
"summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.58, - "output": 1.68 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "zai-org/GLM-4.7-Flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.06, + "output": 0.4 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 202752, + 
"output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -83778,40 +88990,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.43, + "output": 1.74, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -83821,60 +89023,87 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 202752, + "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.02, - "output": 0 + "input": 0.6, + "output": 2.08, + "cache_read": 0.12 }, - "type": 
"embedding" + "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.4, + "output": 1.75, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -83884,8 +89113,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -83906,20 +89135,20 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 1.05, + "output": 3.5, + "cache_read": 0.205 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": 
"DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -83929,29 +89158,42 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0.5, + "output": 2.15, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -83961,43 +89203,55 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.1, + "output": 0.2, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": 
"deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -84006,47 +89260,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.3, + "output": 2.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -84055,97 +89305,84 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-12", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 1.25, - "output": 10, + "input": 0.26, + "output": 0.38, "cache_read": 0.13 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 0.15, + "output": 1.15, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" - }, + } + ] + }, + "v0": { + "id": "v0", + "name": "v0", + "display_name": "v0", + "doc": "https://sdk.vercel.ai/providers/ai-sdk-providers/vercel", + "models": [ { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": 
"v0-1.0-md", + "name": "v0-1.0-md", + "display_name": "v0-1.0-md", "modalities": { "input": [ "text", @@ -84157,29 +89394,28 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "v0-1.5-lg", + "name": "v0-1.5-lg", + "display_name": "v0-1.5-lg", "modalities": { "input": [ "text", @@ -84190,34 +89426,33 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 512000, + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "v0-1.5-md", + "name": "v0-1.5-md", + "display_name": "v0-1.5-md", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -84225,61 +89460,70 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": 
"2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-09", + "last_updated": "2025-06-09", "cost": { - "input": 5.33, - "output": 16 + "input": 3, + "output": 15 }, "type": "chat" - }, + } + ] + }, + "azure": { + "id": "azure", + "name": "Azure", + "display_name": "Azure", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", "cost": { - "input": 10, - "output": 30 + "input": 1.5, + "output": 6, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", "modalities": { "input": [ "text" @@ -84290,77 +89534,53 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.16, + "output": 
0.64 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 1.5, + "output": 2 }, "type": "chat" }, @@ -84409,9 +89629,53 @@ "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "deepseek-v4-flash", + "name": "DeepSeek-V4-Flash", + "display_name": "DeepSeek-V4-Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 384000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": 
"2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 1.74, + "output": 3.48 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ "text", @@ -84422,8 +89686,43 @@ ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 1.75, + "output": 14, + "cache_read": 0.175 + }, + "type": "chat" + }, + { + "id": "o3", + "name": "o3", + "display_name": "o3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -84435,10 +89734,9 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ + "mode": "effort", + "effort": "medium", + "effort_options": [ "low", "medium", "high" @@ -84448,50 +89746,52 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 15, - "output": 120 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { 
"supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.14, - "output": 0 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -84501,8 +89801,8 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -84510,20 +89810,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1, - "output": 2 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ "text" @@ -84533,38 +89833,29 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 2, - "output": 6 + "input": 0.3, + "output": 0.61 }, "type": 
"chat" - } - ] - }, - "privatemode-ai": { - "id": "privatemode-ai", - "name": "Privatemode AI", - "display_name": "Privatemode AI", - "api": "http://localhost:8080/v1", - "doc": "https://docs.privatemode.ai/api/overview", - "models": [ + }, { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -84576,7 +89867,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -84584,20 +89875,20 @@ "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", "modalities": { "input": [ "text" @@ -84607,67 +89898,75 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0, + "input": 0.13, "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "whisper-large-v3", - "name": "Whisper large-v3", - "display_name": "Whisper large-v3", + "id": "o1-mini", + 
"name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2023-09-01", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0, - "output": 0 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "qwen3-embedding-4b", - "name": "Qwen3-Embedding 4B", - "display_name": "Qwen3-Embedding 4B", + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", "modalities": { "input": [ "text" @@ -84677,8 +89976,8 @@ ] }, "limit": { - "context": 32000, - "output": 2560 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": false, @@ -84687,19 +89986,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-06", - "last_updated": "2025-06-06", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0, - "output": 0 + "input": 0.13, + "output": 0.52 }, - "type": "embedding" + "type": "chat" }, { - "id": "qwen3-coder-30b-a3b", - "name": "Qwen3-Coder 30B-A3B", - "display_name": "Qwen3-Coder 30B-A3B", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -84710,7 +90009,7 @@ }, "limit": 
{ "context": 128000, - "output": 32768 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -84719,28 +90018,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" - } - ] - }, - "snowflake-cortex": { - "id": "snowflake-cortex", - "name": "Snowflake Cortex", - "display_name": "Snowflake Cortex", - "api": "https://${SNOWFLAKE_ACCOUNT}.snowflakecomputing.com/api/v2/cortex/v1", - "doc": "https://docs.snowflake.com/en/user-guide/snowflake-cortex/cortex-rest-api", - "models": [ + }, { - "id": "openai-gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ "text", @@ -84751,26 +90041,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 1536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.12, + "output": 0 + }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -84782,8 +90074,8 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -84804,8 +90096,7 @@ "effort_options": [ "low", "medium", - "high", - "max" + "high" ], 
"interleaved": true, "summaries": true, @@ -84814,135 +90105,152 @@ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "openai-gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, "type": "chat" }, { - "id": 
"openai-gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 16384 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.13 + }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 2.5, + "output": 10 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", "type": "chat" }, { - "id": "openai-gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ "text", @@ -84953,26 +90261,29 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.37, + "output": 0.37 + }, "type": "chat" - }, - { - "id": "openai-gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + }, + { + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", @@ -84983,8 +90294,8 @@ ] }, "limit": { - "context": 272000, - "output": 8192 + "context": 400000, + "output": 272000 }, "temperature": false, "tool_call": true, @@ -84992,47 +90303,68 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": 
"2025-08-07", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 15, + "output": 120 + }, "type": "chat" }, { - "id": "openai-gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", "type": "chat" }, { - "id": "openai-gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ "text", @@ -85043,144 +90375,111 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", + "cost": { + "input": 2.5, + "output": 10, + "cache_read": 1.25 + }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", 
- "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", + "cost": { + "input": 60, + "output": 120 + }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" 
to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 + }, "type": "chat" - } - ] - }, - "moonshot-ai": { - "id": "moonshot-ai", - "name": "Moonshot AI", - "display_name": "Moonshot AI", - "api": "https://api.moonshot.ai/v1", - "doc": "https://platform.moonshot.ai/docs/api/chat", - "models": [ + }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ "text" @@ -85190,42 +90489,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-4-32k", 
+ "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ "text" @@ -85235,89 +90521,61 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi 
K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ "text" @@ -85327,8 +90585,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -85337,20 +90595,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 2.4, - "output": 10, - "cache_read": 0.6 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "kimi-k2-0905-preview", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ "text" @@ -85360,8 +90617,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -85370,20 +90627,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "kimi-k2-0711-preview", - "name": "Kimi K2 0711", - "display_name": "Kimi K2 0711", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ "text" @@ -85393,85 +90649,62 @@ ] }, "limit": { - "context": 131072, + "context": 16384, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-14", - "last_updated": 
"2025-07-14", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.2, + "output": 0.78 }, "type": "chat" - } - ] - }, - "perplexity": { - "id": "perplexity", - "name": "Perplexity", - "display_name": "Perplexity", - "doc": "https://docs.perplexity.ai", - "models": [ + }, { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -85482,95 +90715,103 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": 
"2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 1, - "output": 1 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "grok-4-20-non-reasoning", + "name": "Grok 4.20 (Non-Reasoning)", + "display_name": "Grok 4.20 (Non-Reasoning)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 262000, "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 3, - "output": 15 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { "context": 128000, - "output": 4096 + "output": 16384 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 2, - "output": 8 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": 
"chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "deepseek-v4-pro", + "name": "DeepSeek-V4-Pro", + "display_name": "DeepSeek-V4-Pro", "modalities": { "input": [ "text" @@ -85580,40 +90821,41 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 384000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 8, - "reasoning": 3 + "input": 0.19, + "output": 0.51 }, "type": "chat" - } - ] - }, - "llmgateway": { - "id": "llmgateway", - "name": "LLM Gateway", - "display_name": "LLM Gateway", - "api": "https://api.llmgateway.io/v1", - "doc": "https://llmgateway.io/docs", - "models": [ + }, { - "id": "kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -85647,52 +90889,76 @@ "open_weights": true, "knowledge": "2024-08", "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 1.15, - "output": 8, + "input": 0.6, + "output": 2.5, "cache_read": 0.15 }, "type": "chat" }, { - "id": "gemini-pro-latest", - "name": "Gemini Pro Latest", - "display_name": "Gemini Pro Latest", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", 
"modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-27", - "last_updated": "2026-02-27", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "llama-3.1-70b-instruct", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -85702,83 +90968,79 @@ ] }, "limit": { - "context": 128000, - "output": 2048 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": 
"2025-01-20", "cost": { - "input": 0.72, - "output": 0.72 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "grok-4-20-beta-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -85786,20 +91048,27 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -85811,19 +91080,20 
@@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 15, - "output": 120 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -85833,32 +91103,64 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 8192, + "output": 2048 }, "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "gpt-5.3-chat", + "name": "GPT-5.3 Chat", + "display_name": "GPT-5.3 Chat", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-08-31", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30B A3B Instruct (2507)", - "display_name": "Qwen3 30B A3B Instruct (2507)", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { 
"input": [ "text" @@ -85868,28 +91170,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ "text" @@ -85899,112 +91202,70 @@ ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 512, + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.55, - "output": 2.19 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "output": 4 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { @@ -86015,16 +91276,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -86038,154 +91299,111 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + 
"last_updated": "2025-11-14", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen35-397b-a17b", - "name": "Qwen3.5 397B-A17B", - "display_name": "Qwen3.5 397B-A17B", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ "text", - "image", - "video", - "audio" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", - "cost": { - "input": 0.6, - "output": 3.6 - }, - "type": "chat" - }, - { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next 80B-A3B Instruct", - "display_name": "Qwen3-Next 80B-A3B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09", - "last_updated": "2025-09", - "cost": { - "input": 0.5, - "output": 2 - }, - "type": "chat" - }, - { - "id": "sonar", - "name": "Sonar", - "display_name": "Sonar", - "modalities": { - "input": [ - "text" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + 
"verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1, - "output": 1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen2-5-vl-72b-instruct", - "name": "Qwen2.5-VL 72B Instruct", - "display_name": "Qwen2.5-VL 72B Instruct", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2024-09", - "last_updated": "2024-09", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2.8, - "output": 8.4 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "gemma-3-27b", - "name": "Gemma 3 27B", - "display_name": "Gemma 3 27B", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -86197,27 +91415,28 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.27, - "output": 0.27 + "input": 
0.4, + "output": 2 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -86227,92 +91446,100 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen3-vl-30b-a3b-instruct", - "name": "Qwen3 VL 30B A3B Instruct", - "display_name": "Qwen3 VL 30B A3B Instruct", + "id": "o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" 
] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2024-12-20", + "last_updated": "2025-01-29", "cost": { - "input": 0.2, - "output": 0.7 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, @@ -86369,14 +91596,14 @@ "cost": { "input": 1.75, "output": 14, - "cache_read": 0.175 + "cache_read": 0.125 }, "type": "chat" }, { - "id": "glm-4.6v-flash", - "name": "GLM-4.6V Flash", - "display_name": "GLM-4.6V Flash", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -86388,108 +91615,72 @@ }, "limit": { "context": 128000, - "output": 16000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": 
"2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "ministral-14b-2512", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "attachment": false, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.2, - "output": 0.2 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -86504,6 +91695,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -86511,22 +91709,22 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 2, - 
"output": 8, - "cache_read": 0.5 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", "modalities": { "input": [ "text" @@ -86536,71 +91734,27 @@ ] }, "limit": { - "context": 204800, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, - "type": "chat" - }, - { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 + "context": 8191, + "output": 1536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ "text" @@ -86610,42 +91764,30 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": true, + 
"tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.7, - "output": 2.8, - "reasoning": 8.4 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", "modalities": { "input": [ "text" @@ -86655,29 +91797,29 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 0.45, - "output": 2.25 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -86687,86 +91829,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", - "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 - }, - "type": "chat" - }, - { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3 VL 30B A3B Thinking", - "display_name": "Qwen3 VL 30B A3B Thinking", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2025-10-02", - "last_updated": "2025-10-02", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.2, - "output": 1 + "input": 0.3, + "output": 0.61 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -86779,7 +91864,7 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -86810,21 +91895,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": 
"chat" }, { - "id": "ministral-8b-2512", - "name": "Ministral 8B", - "display_name": "Ministral 8B", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", @@ -86835,59 +91920,97 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "glm-4-32b-0414-128k", - "name": "GLM-4 32B (0414-128k)", - "display_name": "GLM-4 32B (0414-128k)", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + 
"open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-fp8", - "name": "Qwen3 235B A22B FP8", - "display_name": "Qwen3 235B A22B FP8", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", "modalities": { "input": [ "text" @@ -86897,29 +92020,29 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "qwen2-5-vl-32b-instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ "text", @@ -86930,28 +92053,36 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-15", - "last_updated": "2025-03-15", + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 1.4, - "output": 4.2 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 
235B A22B Instruct", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", @@ -86962,8 +92093,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -86971,30 +92102,33 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -87008,87 +92142,58 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "qwen3-32b-fp8", - "name": "Qwen3 32B FP8", - "display_name": "Qwen3 32B FP8", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.1, - "output": 0.1 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -87096,26 +92201,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - 
"input_audio": 0.5 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "grok-4-0709", - "name": "Grok 4 (0709)", - "display_name": "Grok 4 (0709)", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -87125,72 +92238,63 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 3, - "output": 15 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "qwen-flash", - "name": "Qwen Flash", - "display_name": "Qwen Flash", + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.05, - "output": 0.4 + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - 
"display_name": "Claude Haiku 4.5 (latest)", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -87234,9 +92338,9 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { "input": 1, "output": 5, @@ -87246,23 +92350,19 @@ "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash-Lite", - "display_name": "Gemini 2.0 Flash-Lite", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 8192 }, "temperature": true, @@ -87270,120 +92370,124 @@ "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "minimax-m3", - "name": "MiniMax-M3", - "display_name": "MiniMax-M3", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + 
], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.12 - }, - "type": "chat" - }, - { - "id": "sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", - "modalities": { - "input": [ - "text", - "image" + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 8192 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", - "cost": { - "input": 3, - "output": 15 + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", + "low", "medium", "high", "xhigh" @@ -87400,18 +92504,19 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - 
"last_updated": "2026-03-05", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 30, - "output": 180 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen-max-latest", - "name": "Qwen Max Latest", - "display_name": "Qwen Max Latest", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -87422,33 +92527,40 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.345, - "output": 1.377 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -87469,16 +92581,16 @@ "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "grok-4-20-beta-0309-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", @@ -87490,27 +92602,59 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { 
- "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, "tiers": [ { - "input": 2.5, - "output": 5, - "cache_read": 0.4, + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, "tier": { "type": "context", "size": 200000 @@ -87518,17 +92662,18 @@ } ], "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 } }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ "text", @@ -87539,8 +92684,8 @@ ] }, "limit": { - "context": 163840, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -87554,20 +92699,20 @@ } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": false, + "release_date": 
"2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.056 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "seed-1-8-251228", - "name": "Seed 1.8 (251228)", - "display_name": "Seed 1.8 (251228)", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ "text", @@ -87578,30 +92723,52 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { "input": 0.25, "output": 2, - "cache_read": 0.05 + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -87612,50 +92779,30 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1047576, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - 
"medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 21, - "output": 168 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "gpt-4o-mini-search-preview", - "name": "GPT-4o Mini Search Preview", - "display_name": "GPT-4o Mini Search Preview", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", @@ -87667,85 +92814,84 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.15, - "output": 0.6 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + 
"effort_options": [ + "minimal", + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ "text" @@ -87755,42 +92901,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", 
"modalities": { "input": [ "text", @@ -87801,8 +92934,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -87815,8 +92948,14 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -87826,20 +92965,64 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + "output": 270 + } }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 512, + "output": 1024 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", + "cost": { + "input": 0.1, + "output": 0 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -87851,10 +93034,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -87864,40 +93047,47 @@ "reasoning": { "supported": 
true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 2.5, + "input": 3, "output": 15, - "cache_read": 0.25 + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ "text" @@ -87907,183 +93097,162 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1.1, - "output": 4.4, - 
"cache_read": 0.55 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "gpt-4o-mini", + "name": "GPT-4o 
mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen-coder-plus", - "name": "Qwen Coder Plus", - "display_name": "Qwen Coder Plus", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 0.502, - "output": 1.004 + "input": 0.14, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "grok-4-20-reasoning", + "name": "Grok 4.20 (Reasoning)", + "display_name": "Grok 4.20 (Reasoning)", "modalities": { "input": [ "text" @@ -88093,8 +93262,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 8192 }, 
"temperature": true, "tool_call": true, @@ -88108,31 +93277,31 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2025-09", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.3, - "output": 1.2 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -88148,10 +93317,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -88162,38 +93331,22 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -88203,56 +93356,83 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": 
true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 1.2, - "output": 6 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.25, + "output": 1 + }, + "type": "chat" + }, + { + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -88260,63 +93440,73 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + 
"medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -88326,29 +93516,29 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": true, + "knowledge": "2023-10", + "release_date": 
"2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 1, - "output": 5 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "phi-3-mini-4k-instruct", + "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -88358,71 +93548,54 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 2048 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": 
"2024-04-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, @@ -88433,14 +93606,17 @@ "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 400000, + "context": 272000, "output": 128000 }, "temperature": false, @@ -88473,8 +93649,8 @@ "attachment": true, "open_weights": false, "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { "input": 1.25, "output": 10, @@ -88483,20 +93659,21 @@ "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -88512,10 +93689,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -88526,18 +93703,42 @@ "visibility": "hidden" } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 - }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } + }, "type": "chat" - }, + } + ] + }, + "cerebras": { + "id": "cerebras", + "name": "Cerebras", + 
"display_name": "Cerebras", + "doc": "https://inference-docs.cerebras.ai/models/overview", + "models": [ { "id": "gpt-oss-120b", "name": "GPT OSS 120B", @@ -88552,7 +93753,7 @@ }, "limit": { "context": 131072, - "output": 32766 + "output": 40960 }, "temperature": true, "tool_call": true, @@ -88566,23 +93767,22 @@ } }, "attachment": false, - "open_weights": false, + "open_weights": true, "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "last_updated": "2026-06-10", "cost": { - "input": 0.05, - "output": 0.25 + "input": 0.35, + "output": 0.75 }, "type": "chat" }, { - "id": "ministral-3b-2512", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "zai-glm-4.7", + "name": "Z.AI GLM-4.7", + "display_name": "Z.AI GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -88590,62 +93790,85 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 40960 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-01-07", + "last_updated": "2026-06-10", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.25, + "output": 2.75, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "zai-coding-plan": { + "id": "zai-coding-plan", + "name": "Z.AI Coding Plan", + "display_name": "Z.AI Coding Plan", + "api": "https://api.z.ai/api/coding/paas/v4", + "doc": "https://docs.z.ai/devpack/overview", + "models": [ { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": 
true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -88655,8 +93878,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -88664,32 +93887,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.108, - "output": 0.675 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast Reasoning", - "display_name": "Grok 4 Fast Reasoning", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + 
"context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -88699,84 +93937,123 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 98304 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" + }, + { + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": 
"hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "nvidia": { + "id": "nvidia", + "name": "Nvidia", + "display_name": "Nvidia", + "api": "https://integrate.api.nvidia.com/v1", + "doc": "https://docs.api.nvidia.com/nim/", + "models": [ { - "id": "llama-4-maverick-17b-instruct", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "baai/bge-m3", + "name": "BGE M3", + "display_name": "BGE M3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -88784,27 +94061,27 @@ }, "limit": { "context": 8192, - "output": 2048 + "output": 1024 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2024-01-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "moonshotai/kimi-k2-instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -88814,39 +94091,42 @@ ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, 
"open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.03, - "output": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking (2507)", - "display_name": "Qwen3 235B A22B Thinking (2507)", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -88865,64 +94145,76 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2026-03-18", + "last_updated": "2026-04-11", "cost": { - "input": 
0.5, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-4b-fp8", - "name": "Qwen3 4B FP8", - "display_name": "Qwen3 4B FP8", + "id": "stepfun-ai/step-3.7-flash", + "name": "Step 3.7 Flash", + "display_name": "Step 3.7 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -88930,20 +94222,20 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -88953,8 +94245,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -88962,27 +94254,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "open_weights": true, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-vl-plus", - "name": "Qwen-VL Plus", - "display_name": "Qwen-VL Plus", + "id": "google/gemma-3n-e4b-it", + "name": "Gemma 3n E4b It", + "display_name": "Gemma 3n E4b It", "modalities": { "input": [ "text", @@ -88993,345 +94278,276 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + 
"output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-08-15", + "attachment": true, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-03", + "last_updated": "2025-06-03", "cost": { - "input": 0.21, - "output": 0.63 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "google/gemma-3n-e2b-it", + "name": "Gemma 3n E2b It", + "display_name": "Gemma 3n E2b It", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32766 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": true, + "knowledge": "2024-06", + "release_date": "2025-06-12", + "last_updated": "2025-06-12", "cost": { - "input": 0.04, - "output": 0.15 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-4-scout", - "name": "Llama 4 Scout", - "display_name": "Llama 4 Scout", + "id": "google/google-paligemma", + "name": "paligemma", + "display_name": "paligemma", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2024-05-14", + "last_updated": "2024-08-26", 
"cost": { - "input": 0.18, - "output": 0.59 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "google/gemma-4-31b-it", + "name": "Gemma-4-31B-IT", + "display_name": "Gemma-4-31B-IT", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 2, - "output": 8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "google/gemma-2-2b-it", + "name": "Gemma 2 2b It", + "display_name": "Gemma 2 2b It", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": 
"2024-07-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "microsoft/phi-4-mini-instruct", + "name": "Phi-4-Mini", + "display_name": "Phi-4-Mini", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "microsoft/phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", 
- "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS-120B", + "display_name": "GPT-OSS-120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -89341,92 +94557,66 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": 
"2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-04", + "last_updated": "2025-08-14", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.2-11b-instruct", - "name": "Llama 3.2 11B Instruct", - "display_name": "Llama 3.2 11B Instruct", + "id": "openai/whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.07, - "output": 0.33 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-vl-plus", - "name": "Qwen3-VL Plus", - "display_name": "Qwen3-VL Plus", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 131072, "output": 32768 }, "temperature": true, @@ -89437,122 +94627,59 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": 
"2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.2, - "output": 1.6, - "reasoning": 4.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.6v-flashx", - "name": "GLM-4.6V FlashX", - "display_name": "GLM-4.6V FlashX", + "id": "bytedance/seed-oss-36b-instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 128000, - "output": 16000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", - "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.004 - }, - "type": "chat" - }, - { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262000, + "output": 262000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 
0.02 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "mistralai/mistral-7b-instruct-v03", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ "text" @@ -89562,8 +94689,8 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -89571,110 +94698,49 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "mistralai/magistral-small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ - "text", - "image", - "pdf" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 200000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 - }, - "type": "chat" - }, - { - "id": "qwen3-vl-8b-instruct", - "name": "Qwen3 VL 8B Instruct", - "display_name": "Qwen3 VL 8B Instruct", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.08, - "output": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-max", - "name": "Qwen Max", - "display_name": "Qwen Max", + "id": "mistralai/mixtral-8x7b-instruct", + "name": "Mistral: Mixtral 8x7B Instruct", + "display_name": "Mistral: Mixtral 8x7B Instruct", "modalities": { "input": [ "text" @@ -89685,7 +94751,7 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -89693,73 +94759,62 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-03", - "last_updated": "2025-01-25", + "open_weights": true, + "release_date": "2023-12-10", + "last_updated": "2026-03-15", "cost": { - "input": 1.6, - "output": 6.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-omni-turbo", - "name": "Qwen-Omni Turbo", - "display_name": "Qwen-Omni Turbo", + "id": "mistralai/mistral-medium-3-instruct", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ - "text", - 
"audio" + "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-19", - "last_updated": "2025-03-26", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.07, - "output": 0.27, - "input_audio": 4.44, - "output_audio": 8.89 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "mistralai/mistral-small-4-119b-2603", + "name": "mistral-small-4-119b-2603", + "display_name": "mistral-small-4-119b-2603", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -89767,55 +94822,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", 
- "name": "Qwen3-Coder 480B-A35B Instruct", - "display_name": "Qwen3-Coder 480B-A35B Instruct", + "id": "mistralai/mistral-nemotron", + "name": "mistral-nemotron", + "display_name": "mistral-nemotron", "modalities": { "input": [ "text" @@ -89825,8 +94845,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -89835,271 +94855,193 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2025-04", + "release_date": "2025-06-11", + "last_updated": "2025-06-12", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B Instruct 2512", + "display_name": "Mistral Large 3 675B Instruct 2512", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2025-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, 
+ "output": 13108 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "nvidia/cosmos-transfer1-7b", + "name": "cosmos-transfer1-7b", + "display_name": "cosmos-transfer1-7b", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "release_date": "2025-06-13", + "last_updated": "2025-06-30", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "nvidia/cosmos-transfer2_5-2b", + "name": "cosmos-transfer2.5-2b", + "display_name": 
"cosmos-transfer2.5-2b", "modalities": { "input": [ "text", "image", - "audio", - "video", - "pdf" + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3-Next 80B-A3B (Thinking)", - "display_name": "Qwen3-Next 80B-A3B (Thinking)", + "id": "nvidia/llama-nemotron-embed-vl-1b-v2", + "name": "llama-nemotron-embed-vl-1b-v2", + "display_name": "llama-nemotron-embed-vl-1b-v2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": 
"2025-09", - "last_updated": "2025-09", + "release_date": "2026-02-10", + "last_updated": "2026-02-10", "cost": { - "input": 0.5, - "output": 6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", + "name": "Nemotron 3 Nano Omni", + "display_name": "Nemotron 3 Nano Omni", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 256000, "output": 65536 }, "temperature": true, @@ -90108,219 +95050,148 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-coder-flash", - "name": "Qwen3 Coder Flash", - "display_name": "Qwen3 Coder Flash", + "id": "nvidia/magpie-tts-zeroshot", + "name": "magpie-tts-zeroshot", + "display_name": "magpie-tts-zeroshot", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": 
"2025-07-28", - "last_updated": "2025-07-28", + "attachment": true, + "open_weights": true, + "release_date": "2025-05-22", + "last_updated": "2025-06-12", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "nvidia-nemotron-nano-9b-v2", + "display_name": "nvidia-nemotron-nano-9b-v2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mistral-small-2506", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "nvidia/synthetic-video-detector", + "name": "synthetic-video-detector", + "display_name": "synthetic-video-detector", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 8192, + "output": 4096 }, "temperature": true, - "tool_call": true, + 
"tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "nvidia/nemotron-content-safety-reasoning-4b", + "name": "nemotron-content-safety-reasoning-4b", + "display_name": "nemotron-content-safety-reasoning-4b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen Turbo", - "display_name": "Qwen Turbo", + "id": "nvidia/nv-embed-v1", + "name": "nv-embed-v1", + "display_name": "nv-embed-v1", "modalities": { "input": [ "text" @@ -90330,42 +95201,28 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-11-01", - "last_updated": "2025-04-28", + "open_weights": true, + "release_date": "2024-06-07", + "last_updated": "2025-07-22", "cost": { - "input": 0.05, - "output": 0.2, - "reasoning": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwq-plus", - "name": "QwQ Plus", - "display_name": "QwQ Plus", + "id": "nvidia/usdcode", + "name": "usdcode", + "display_name": "usdcode", "modalities": { "input": [ "text" @@ -90375,122 +95232,90 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-03-05", - "last_updated": "2025-03-05", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 0.8, - "output": 2.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-vl-flash", - "name": "Qwen3 VL Flash", - "display_name": "Qwen3 VL Flash", + "id": "nvidia/riva-translate-4b-instruct-v1_1", + "name": "riva-translate-4b-instruct-v1_1", + "display_name": "riva-translate-4b-instruct-v1_1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - 
"supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-09", - "last_updated": "2025-10-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-12", + "last_updated": "2025-12-12", "cost": { - "input": 0.022, - "output": 0.215, - "cache_read": 0.0044 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "nvidia/sparsedrive", + "name": "sparsedrive", + "display_name": "sparsedrive", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "nvidia/rerank-qa-mistral-4b", + "name": "rerank-qa-mistral-4b", + "display_name": "rerank-qa-mistral-4b", "modalities": { "input": [ "text" @@ -90500,347 +95325,248 @@ ] }, "limit": { - "context": 16385, + "context": 128000, "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + 
"release_date": "2024-03-17", + "last_updated": "2025-01-17", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "nvidia/streampetr", + "name": "streampetr", + "display_name": "streampetr", "modalities": { "input": [ - "text" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "grok-4-20-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "nvidia/active-speaker-detection", + "name": "Active Speaker Detection", + "display_name": "Active Speaker Detection", "modalities": { "input": [ - "text", - "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - 
"input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", + "name": "llama-3.1-nemotron-safety-guard-8b-v3", + "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20241022", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", + "name": "llama-3_2-nemoretriever-300m-embed-v1", + "display_name": "llama-3_2-nemoretriever-300m-embed-v1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 
32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-24", + "last_updated": "2025-07-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemma-2-27b-it-together", - "name": "Gemma 2 27B IT", - "display_name": "Gemma 2 27B IT", + "id": "nvidia/nemotron-voicechat", + "name": "nemotron-voicechat", + "display_name": "nemotron-voicechat", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 16384 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-06-27", - "last_updated": "2024-06-27", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.08, - "output": 0.08 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "nvidia/nv-embedcode-7b-v1", + "name": "nv-embedcode-7b-v1", + "display_name": "nv-embedcode-7b-v1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 2048 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - 
"unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-17", + "last_updated": "2025-05-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "custom", - "name": "Custom Model", - "display_name": "Custom Model", + "id": "nvidia/nemotron-3-ultra-550b-a55b", + "name": "Nemotron 3 Ultra 550B A55B", + "display_name": "Nemotron 3 Ultra 550B A55B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-06-04", + "last_updated": "2026-06-04", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "nemotron-3-nano-30b-a3b", + "display_name": "nemotron-3-nano-30b-a3b", "modalities": { "input": [ "text" @@ -90850,118 +95576,94 
@@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "knowledge": "2024-09", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "nvidia/cosmos-predict1-5b", + "name": "cosmos-predict1-5b", + "display_name": "cosmos-predict1-5b", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-03-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-3-opus", - "name": "Claude 3 Opus", - "display_name": "Claude 3 Opus", + "id": "nvidia/bevformer", + "name": "bevformer", + "display_name": "bevformer", "modalities": { "input": [ - "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 4096 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "open_weights": true, + "release_date": "2025-03-18", + "last_updated": "2025-07-20", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.1-nemotron-ultra-253b", - "name": "Llama 3.1 Nemotron Ultra 253B", - "display_name": "Llama 3.1 Nemotron Ultra 253B", + "id": "nvidia/studiovoice", + "name": "studiovoice", + "display_name": "studiovoice", "modalities": { "input": [ "text" @@ -90981,64 +95683,49 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-04-07", - "last_updated": "2025-04-07", + "release_date": "2024-10-03", + "last_updated": "2025-06-13", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B-A3B", - "display_name": "Qwen3.6 35B-A3B", + "id": "nvidia/gliner-pii", + "name": "gliner-pii", + "display_name": "gliner-pii", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.248, - "output": 1.485 + "input": 0, + "output": 0 
}, "type": "chat" }, { - "id": "minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "nvidia/nemotron-mini-4b-instruct", + "name": "nemotron-mini-4b-instruct", + "display_name": "nemotron-mini-4b-instruct", "modalities": { "input": [ "text" @@ -91048,42 +95735,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-08-21", + "last_updated": "2024-08-26", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max (2026-01-23)", - "display_name": "Qwen3 Max (2026-01-23)", + "id": "nvidia/llama-nemotron-rerank-vl-1b-v2", + "name": "llama-nemotron-rerank-vl-1b-v2", + "display_name": "llama-nemotron-rerank-vl-1b-v2", "modalities": { "input": [ "text", @@ -91094,41 +95767,28 @@ ] }, "limit": { - "context": 256000, - "output": 32800 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "open_weights": true, + "release_date": "2026-03-31", + "last_updated": "2026-03-31", "cost": { - "input": 
0.359, - "output": 1.434, - "cache_read": 0.072 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super", + "display_name": "Nemotron 3 Super", "modalities": { "input": [ "text" @@ -91138,8 +95798,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -91147,33 +95807,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "llama-3-70b-instruct", - "name": "Llama 3 70B Instruct", - "display_name": "Llama 3 70B Instruct", + "id": "nvidia/usdvalidate", + "name": "usdvalidate", + "display_name": "usdvalidate", "modalities": { "input": [ "text" @@ -91184,70 +95832,89 @@ }, "limit": { "context": 8192, - "output": 8000 + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2024-07-24", + "last_updated": "2025-01-08", "cost": { - "input": 0.51, - "output": 0.74 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-plus-latest", - "name": "Qwen Plus Latest", - "display_name": "Qwen Plus Latest", + "id": "nvidia/nemotron-3-content-safety", + "name": "nemotron-3-content-safety", + "display_name": 
"nemotron-3-content-safety", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 128000, + "output": 4096 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-16", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" + }, + { + "id": "abacusai/dracarys-llama-3_1-70b-instruct", + "name": "dracarys-llama-3.1-70b-instruct", + "display_name": "dracarys-llama-3.1-70b-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-25", - "last_updated": "2025-01-25", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-11", + "last_updated": "2025-05-22", "cost": { - "input": 0.115, - "output": 0.287 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30B A3B Thinking (2507)", - "display_name": "Qwen3 30B A3B Thinking (2507)", + "id": "deepseek-ai/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -91257,8 +95924,8 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -91279,80 +95946,65 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": 
"2026-04-24", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 393216 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "llama-3-8b-instruct", - "name": "Llama 3 8B Instruct", - "display_name": "Llama 3 8B Instruct", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -91362,105 +96014,93 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-03", - "last_updated": "2025-04-03", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", + "id": "qwen/qwen-image-edit", + "name": "Qwen Image Edit", + "display_name": "Qwen Image Edit", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.1, - 
"output": 0.3 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen/qwen-image", + "name": "Qwen Image", + "display_name": "Qwen Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "qwen/qwen3-coder-480b-a35b-instruct", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -91471,7 +96111,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 66536 }, "temperature": true, "tool_call": true, @@ -91479,20 +96119,20 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.4, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + 
"id": "qwen/qwen2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32b Instruct", + "display_name": "Qwen2.5 Coder 32b Instruct", "modalities": { "input": [ "text" @@ -91502,228 +96142,182 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2024-11-06", + "last_updated": "2024-11-06", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct (2507)", - "display_name": "Qwen3 235B A22B Instruct (2507)", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 262144, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "knowledge": "2026-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.09, - "output": 0.58 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", - "image" + 
"image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "sarvamai/sarvam-m", + "name": "sarvam-m", + "display_name": "sarvam-m", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - 
"cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-4.5-x", - "name": "GLM-4.5 X", - "display_name": "GLM-4.5 X", + "id": "meta/llama-3.1-70b-instruct", + "name": "Llama 3.1 70b Instruct", + "display_name": "Llama 3.1 70b Instruct", "modalities": { "input": [ "text" @@ -91734,33 +96328,30 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-16", "cost": { - "input": 2.2, - "output": 8.9, - "cache_read": 0.45 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1b Instruct", + "display_name": "Llama 3.2 1b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -91768,86 +96359,72 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 2, - "output": 6 + "input": 0, + "output": 0 }, 
"type": "chat" }, { - "id": "qwen3.6-max-preview", - "name": "Qwen3.6 Max Preview", - "display_name": "Qwen3.6 Max Preview", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11b Vision Instruct", + "display_name": "Llama 3.2 11b Vision Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.13, - "cache_write": 1.625 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen-vl-max", - "name": "Qwen-VL Max", - "display_name": "Qwen-VL Max", + "id": "meta/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -91855,30 +96432,30 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-04-08", - "last_updated": "2025-08-13", + "open_weights": true, + "release_date": "2024-11-26", + "last_updated": "2024-11-26", "cost": { - "input": 0.8, - "output": 3.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral", - 
"display_name": "Codestral", + "id": "meta/llama-guard-4-12b", + "name": "Llama Guard 4 12B", + "display_name": "Llama Guard 4 12B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 128000, "output": 16384 }, "temperature": true, @@ -91886,20 +96463,20 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "release_date": "2025-04-05", + "last_updated": "2026-04-30", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "meta/esmfold", + "name": "esmfold", + "display_name": "esmfold", "modalities": { "input": [ "text" @@ -91909,34 +96486,28 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2024-03-15", + "last_updated": "2025-06-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "meta/esm2-650m", + "name": "esm2-650m", + "display_name": "esm2-650m", "modalities": { "input": [ "text" @@ -91946,39 +96517,32 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": 
false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-08-29", + "last_updated": "2025-03-10", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "meta/llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -91986,27 +96550,28 @@ }, "limit": { "context": 128000, - "output": 2048 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "seed-1-6-250915", - "name": "Seed 1.6 (250915)", - "display_name": "Seed 1.6 (250915)", + "id": "meta/llama-4-maverick-17b-128e-instruct", + "name": "Llama 4 Maverick 17b 128e Instruct", + "display_name": "Llama 4 Maverick 17b 128e Instruct", "modalities": { "input": [ "text", @@ -92017,324 +96582,233 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2024-02", + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude 
Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "attachment": false, + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2024-09-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "upstage/solar-10_7b-instruct", + "name": "solar-10.7b-instruct", + "display_name": "solar-10.7b-instruct", "modalities": { - "input": [ - "text", - "image" + "input": [ + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, 
- "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-06-05", + "last_updated": "2025-04-10", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "black-forest-labs/flux_1-schnell", + "name": "FLUX.1-schnell", + "display_name": "FLUX.1-schnell", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 77, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": 
"black-forest-labs/flux_1-kontext-dev", + "name": "FLUX.1-Kontext-dev", + "display_name": "FLUX.1-Kontext-dev", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 40960, + "output": 40960 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "open_weights": true, + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 10, - "output": 30 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "black-forest-labs/flux.1-dev", + "name": "FLUX.1-dev", + "display_name": "FLUX.1-dev", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 4096, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-06-02", - "last_updated": "2026-06-02", + "knowledge": "2024-08", + "release_date": "2024-08-01", + "last_updated": "2025-09-05", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.08, - "cache_write": 0.5 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "black-forest-labs/flux_2-klein-4b", + "name": "FLUX.2 Klein 4B", + "display_name": "FLUX.2 Klein 4B", "modalities": { "input": [ + "image", "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 
204800, - "output": 131072 + "context": 40960, + "output": 40960 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "knowledge": "2025-06", + "release_date": "2026-01-14", + "last_updated": "2026-01-31", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "evroc": { + "id": "evroc", + "name": "evroc", + "display_name": "evroc", + "api": "https://models.think.evroc.com/v1", + "doc": "https://docs.evroc.com/products/think/overview.html", + "models": [ { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -92342,10 +96816,9 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -92362,156 +96835,81 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "tiers": [ - { - "input": 0.8, - "output": 4, - "cache_read": 0.16, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 1.47, + "output": 5.9 }, "type": "chat" }, { - "id": "claude-3-7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": 
"microsoft/Phi-4-multimodal-instruct", + "name": "Phi-4 15B", + "display_name": "Phi-4 15B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 32000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 0.24, + "output": 0.47 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "Qwen/Qwen3-Embedding-8B", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 40960, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive 
thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.12, + "output": 0.12 }, - "type": "chat" + "type": "embedding" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", + "name": "Qwen3 30B 2507", + "display_name": "Qwen3 30B 2507", "modalities": { "input": [ "text" @@ -92521,60 +96919,59 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 64000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0, - "output": 0 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": "qwen25-coder-7b", - "name": "Qwen2.5 Coder 7B", - "display_name": "Qwen2.5 Coder 7B", + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen3 VL 30B", + "display_name": "Qwen3 VL 30B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 100000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2024-09-19", - "last_updated": 
"2024-09-19", + "release_date": "2025-07-30", + "last_updated": "2025-07-30", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "MiMo-V2-Flash", - "display_name": "MiMo-V2-Flash", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -92584,10 +96981,9 @@ ] }, "limit": { - "context": 262144, + "context": 65536, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -92595,63 +96991,54 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.24, + "output": 0.94 }, "type": "chat" }, { - "id": "qwen3-30b-a3b-fp8", - "name": "Qwen3 30B A3B FP8", - "display_name": "Qwen3 30B A3B FP8", + "id": "openai/whisper-large-v3", + "name": "Whisper 3 Large", + "display_name": "Whisper 3 Large", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 448, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": 
"mistralai/devstral-small-2-24b-instruct-2512", + "name": "Devstral Small 2 24B Instruct 2512", + "display_name": "Devstral Small 2 24B Instruct 2512", "modalities": { "input": [ "text" @@ -92661,29 +97048,27 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.12 + "input": 0.12, + "output": 0.47 }, "type": "chat" }, { - "id": "gemma-3-1b-it", - "name": "Gemma 3 1B IT", - "display_name": "Gemma 3 1B IT", + "id": "mistralai/Magistral-Small-2509", + "name": "Magistral Small 1.2 24B", + "display_name": "Magistral Small 1.2 24B", "modalities": { "input": [ "text" @@ -92693,78 +97078,59 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-03-12", - "last_updated": "2025-03-12", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.59, + "output": 2.36 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "mistralai/Voxtral-Small-24B-2507", + "name": "Voxtral Small 24B", + "display_name": "Voxtral Small 24B", "modalities": { "input": [ - "text", - "image", - "pdf" + "audio", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32000, + "output": 32000 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", 
- "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "nvidia/Llama-3.3-70B-Instruct-FP8", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -92774,123 +97140,97 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 1.18, + "output": 1.18 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "KBLab/kb-whisper-large", + "name": "KB Whisper", + "display_name": "KB Whisper", "modalities": { "input": [ - "text", - "image", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 448, + "output": 448 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.00236, + "output": 0.00236, + "output_audio": 2.36 }, "type": "chat" }, { - "id": "seed-1-6-250615", - "name": "Seed 1.6 (250615)", - "display_name": "Seed 1.6 (250615)", + "id": "intfloat/multilingual-e5-large-instruct", + "name": "E5 Multi-Lingual Large Embeddings 0.6B", + "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 512, + "output": 512 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0.12, + "output": 0.12 }, "type": "chat" - }, + } + ] + }, + "xiaomi": { + "id": "xiaomi", + "name": "Xiaomi", + "display_name": "Xiaomi", + "api": "https://api.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "glm-4.5-airx", - "name": "GLM-4.5 AirX", - "display_name": "GLM-4.5 AirX", + "id": "mimo-v2.5-pro-ultraspeed", + "name": "MiMo-V2.5-Pro-UltraSpeed", + "display_name": "MiMo-V2.5-Pro-UltraSpeed", "modalities": { "input": [ "text" @@ -92900,41 +97240,56 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + 
"output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-06-08", + "last_updated": "2026-06-09", "cost": { - "input": 1.1, - "output": 4.5, - "cache_read": 0.22 + "input": 1.305, + "output": 2.61, + "cache_read": 0.0108 }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -92942,116 +97297,143 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 0.4, + "output": 2, + "cache_read": 0.08, + "tiers": [ + { + "input": 0.8, + "output": 4, + "cache_read": 0.16, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 0.8, + "output": 4, + "cache_read": 0.16 + } }, "type": "chat" }, { - "id": "llama-4-scout-17b-instruct", - "name": "Llama 4 Scout 17B Instruct", - "display_name": 
"Llama 4 Scout 17B Instruct", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "mimo-v2-flash", + "name": "MiMo-V2-Flash", + "display_name": "MiMo-V2-Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 
400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "minimax-text-01", - "name": "MiniMax Text 01", - "display_name": "MiniMax Text 01", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -93061,29 +97443,58 @@ ] }, "limit": { - "context": 1000000, + "context": 1048576, "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.2, - "output": 1.1 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -93093,29 +97504,67 @@ ] }, "limit": { 
- "context": 8192, - "output": 8192 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 30, - "output": 60 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" - }, + } + ] + }, + "inception": { + "id": "inception", + "name": "Inception", + "display_name": "Inception", + "api": "https://api.inceptionlabs.ai/v1/", + "doc": "https://platform.inceptionlabs.ai/docs", + "models": [ { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "mercury-edit-2", + "name": "Mercury Edit 2", + "display_name": "Mercury Edit 2", "modalities": { "input": [ "text" @@ -93125,44 +97574,41 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.25, + "output": 0.75, + 
"cache_read": 0.025 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 50000 }, "temperature": true, "tool_call": true, @@ -93170,73 +97616,99 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-01-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" - }, + } + ] + }, + "anthropic": { + "id": "anthropic", + "name": "Anthropic", + "display_name": "Anthropic", + "doc": "https://docs.anthropic.com/en/docs/about-claude/models", + "models": [ { - "id": "qwen3-vl-235b-a22b-thinking", - "name": "Qwen3 VL 235B A22B Thinking", - "display_name": "Qwen3 VL 235B A22B Thinking", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ 
"thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.5, - "output": 2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -93244,41 +97716,52 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, - "cache_write": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "grok-4-20-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "claude-3-5-haiku-20241022", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ "text", @@ -93290,611 +97773,727 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax M2.1 Lightning", + "id": "claude-opus-4-0", + "name": "Claude Opus 4 (latest)", + "display_name": "Claude Opus 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.12, - "output": 0.48 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-4o-search-preview", - "name": "GPT-4o Search Preview", - "display_name": "GPT-4o Search Preview", + "id": "claude-3-opus-20240229", + "name": "Claude Opus 3", + "display_name": "Claude Opus 3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 4096 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 2.5, - "output": 10 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "claude-opus-4-1-20250805", + "name": "Claude Opus 4.1", + 
"display_name": "Claude Opus 4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "auto", - "name": "Auto Route", - "display_name": "Auto Route", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen-plus", - "name": "Qwen Plus", - "display_name": "Qwen Plus", + "id": "claude-opus-4-5-20251101", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-01-25", - "last_updated": "2025-09-11", + "knowledge": "2025-03-31", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.4, - "output": 1.2, - "reasoning": 4 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "seed-1-6-flash-250715", - "name": "Seed 1.6 Flash (250715)", - "display_name": "Seed 1.6 Flash (250715)", + "id": "claude-3-5-sonnet-20241022", + "name": "Claude Sonnet 3.5 v2", + "display_name": "Claude Sonnet 3.5 v2", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 200000, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", - "cost": { - "input": 0.07, - "output": 0.3, - "cache_read": 0.015 - }, - "type": "chat" - } - ] - }, - "togetherai": { - "id": "togetherai", - "name": "Together AI", - "display_name": "Together AI", - "doc": "https://docs.together.ai/docs/serverless-models", - "models": [ - { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.3, - "output": 1.2, - 
"cache_read": 0.06 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "claude-opus-4-20250514", + "name": "Claude Opus 4", + "display_name": "Claude Opus 4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.4, - "output": 4.4 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "essentialai/Rnj-1-Instruct", - "name": "Rnj-1 Instruct", - "display_name": "Rnj-1 Instruct", + "id": "claude-3-5-sonnet-20240620", + "name": "Claude Sonnet 3.5", + "display_name": "Claude Sonnet 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-12-05", - "last_updated": "2025-12-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-06-20", + "last_updated": "2024-06-20", "cost": { - "input": 0.15, - "output": 0.15 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "claude-sonnet-4-20250514", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, 
+ "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.2, - "output": 4.5, - "cache_read": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.5, - "output": 2.8 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "claude-3-haiku-20240307", + "name": "Claude Haiku 3", + "display_name": "Claude Haiku 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0.88, - "output": 0.88 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 384000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -93903,292 +98502,487 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + 
"high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 2.1, - "output": 4.4, - "cache_read": 0.2 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "claude-sonnet-4-0", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model 
family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.6, - "output": 1.7 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "claude-3-7-sonnet-20250219", + "name": "Claude Sonnet 3.7", + "display_name": "Claude Sonnet 3.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 163839, - "output": 163839 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-03-24", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { "input": 3, - "output": 7 + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + 
"output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2025-05-29", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.25, - "output": 1.25 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-ultra-550b-a55b", - "name": "Nemotron 3 Ultra 550B A55B", - "display_name": "Nemotron 3 Ultra 550B A55B", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512300, - "output": 512300 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.2 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-Plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 500000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.5, - "output": 3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-Next-FP8", - "name": "Qwen3 Coder Next FP8", - "display_name": "Qwen3 Coder Next FP8", + "id": "claude-3-sonnet-20240229", + "name": "Claude Sonnet 3", + "display_name": "Claude Sonnet 3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-02-03", - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0.5, - "output": 1.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 130000 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": 
"high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.6, - "output": 3.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "Qwen/Qwen3.7-Max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "claude-3-5-haiku-latest", + "name": "Claude Haiku 3.5 (latest)", + "display_name": "Claude Haiku 3.5 (latest)", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + }, + "type": "chat" + } + ] + }, + "tencent-coding-plan": { + "id": "tencent-coding-plan", + "name": "Tencent Coding Plan (China)", + "display_name": "Tencent Coding Plan (China)", + "api": "https://api.lkeap.cloud.tencent.com/coding/v3", + "doc": "https://cloud.tencent.com/document/product/1772/128947", + "models": [ + { + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -94198,8 +98992,8 @@ ] }, "limit": { - "context": 1000000, - "output": 
500000 + "context": 204800, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -94209,26 +99003,36 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.5, - "output": 7.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", - "name": "Qwen3 235B A22B Instruct 2507 FP8", - "display_name": "Qwen3 235B A22B Instruct 2507 FP8", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -94236,7 +99040,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -94244,21 +99048,34 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "hunyuan-turbos", + "name": "Hunyuan-TurboS", + "display_name": "Hunyuan-TurboS", "modalities": { "input": [ 
"text" @@ -94268,8 +99085,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -94277,32 +99094,32 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", "cost": { - "input": 2, - "output": 2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B Instruct", - "display_name": "Gemma 4 31B Instruct", + "id": "hunyuan-t1", + "name": "Hunyuan-T1", + "display_name": "Hunyuan-T1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -94310,21 +99127,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", "cost": { - "input": 0.2, - "output": 0.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "tc-code-latest", + "name": "Auto", + "display_name": "Auto", "modalities": { "input": [ "text" @@ -94335,43 +99164,29 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "moark": { - "id": "moark", - "name": "Moark", - "display_name": "Moark", - "api": "https://moark.com/v1", - "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", - "models": [ + }, { - "id": "GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -94381,8 +99196,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 202752, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -94402,20 +99217,21 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 3.5, - "output": 14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "hunyuan-2.0-instruct", + "name": "Tencent HY 2.0 Instruct", + "display_name": "Tencent HY 2.0 Instruct", "modalities": { "input": [ "text" @@ -94425,43 +99241,30 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": 
"2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", "cost": { - "input": 2.1, - "output": 8.4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - } - ] - }, - "github-models": { - "id": "github-models", - "name": "GitHub Models", - "display_name": "GitHub Models", - "api": "https://models.github.ai/inference", - "doc": "https://docs.github.com/en/github-models", - "models": [ + }, { - "id": "core42/jais-30b-chat", - "name": "JAIS 30b Chat", - "display_name": "JAIS 30b Chat", + "id": "hunyuan-2.0-thinking", + "name": "Tencent HY 2.0 Think", + "display_name": "Tencent HY 2.0 Think", "modalities": { "input": [ "text" @@ -94471,8 +99274,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -94480,382 +99283,672 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, - "open_weights": true, - "knowledge": "2023-03", - "release_date": "2023-08-30", - "last_updated": "2023-08-30", + "open_weights": false, + "release_date": "2026-03-08", + "last_updated": "2026-03-08", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "freemodel": { + "id": "freemodel", + "name": "FreeModel", + "display_name": "FreeModel", + "api": "https://cc.freemodel.dev/v1", + "doc": "https://freemodel.dev", + "models": [ { - "id": "deepseek/deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - 
"context": 65536, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + 
"visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-large", - "name": "AI21 Jamba 1.5 Large", - "display_name": "AI21 Jamba 1.5 Large", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175, + "cache_write": 1.75 }, "type": "chat" }, { - "id": "ai21-labs/ai21-jamba-1.5-mini", - "name": "AI21 Jamba 1.5 Mini", - "display_name": "AI21 Jamba 1.5 Mini", + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 1000000, + "output": 128000 }, - 
"temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-29", - "last_updated": "2024-08-29", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0, - "output": 0 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - "display_name": "Grok 3", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, 
"open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "cache_write": 2.5 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-09", - "last_updated": "2024-12-09", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075, + "cache_write": 0.75 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus-08-2024", - "name": "Cohere Command R+ 08-2024", - "display_name": "Cohere Command R+ 08-2024", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-08-2024", - "name": "Cohere Command R 08-2024", - "display_name": "Cohere Command R 08-2024", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + 
"notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-08-01", - "last_updated": "2024-08-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "cohere/cohere-command-r", - "name": "Cohere Command R", - "display_name": "Cohere Command R", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-11", - "last_updated": "2024-08-01", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5, + "cache_write": 5 }, "type": "chat" - }, + } + ] + }, + "sap-ai-core": { + "id": "sap-ai-core", + "name": "SAP AI Core", + "display_name": "SAP AI Core", + "doc": "https://help.sap.com/docs/sap-ai-core", + "models": [ { - "id": "cohere/cohere-command-a", 
- "name": "Cohere Command A", - "display_name": "Cohere Command A", + "id": "anthropic--claude-4.6-sonnet", + "name": "anthropic--claude-4.6-sonnet", + "display_name": "anthropic--claude-4.6-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -94863,31 +99956,35 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-08", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "cohere/cohere-command-r-plus", - "name": "Cohere Command R+", - "display_name": "Cohere Command R+", + "id": "anthropic--claude-3-sonnet", + "name": "anthropic--claude-3-sonnet", + "display_name": "anthropic--claude-3-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, @@ -94895,32 +99992,36 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-04-04", - "last_updated": "2024-08-01", + "knowledge": "2023-08-31", + "release_date": "2024-03-04", + "last_updated": "2024-03-04", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistral-ai/mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "anthropic--claude-4-sonnet", + "name": "anthropic--claude-4-sonnet", + "display_name": "anthropic--claude-4-sonnet", "modalities": { 
"input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -94928,32 +100029,38 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "mistral-ai/ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "gemini-2.5-pro", + "name": "gemini-2.5-pro", + "display_name": "gemini-2.5-pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -94961,21 +100068,41 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-25", + "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mistral-ai/mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "gpt-5", + "name": 
"gpt-5", + "display_name": "gpt-5", "modalities": { "input": [ "text", @@ -94986,41 +100113,67 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "mistral-ai/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "gemini-2.5-flash", + "name": "gemini-2.5-flash", + "display_name": "gemini-2.5-flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -95028,33 +100181,56 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + 
"open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-04-17", + "last_updated": "2025-06-05", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "mistral-ai/mistral-medium-2505", - "name": "Mistral Medium 3 (25.05)", - "display_name": "Mistral Medium 3 (25.05)", + "id": "anthropic--claude-4.5-haiku", + "name": "anthropic--claude-4.5-haiku", + "display_name": "anthropic--claude-4.5-haiku", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -95062,65 +100238,72 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "mistral-ai/codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "anthropic--claude-3-haiku", + "name": "anthropic--claude-3-haiku", + "display_name": "anthropic--claude-3-haiku", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2023-08-31", + "release_date": "2024-03-13", + "last_updated": "2024-03-13", "cost": { - "input": 0, - "output": 0 + "input": 
0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-128k-instruct", - "name": "Phi-3-medium instruct (128k)", - "display_name": "Phi-3-medium instruct (128k)", + "id": "anthropic--claude-4-opus", + "name": "anthropic--claude-4-opus", + "display_name": "anthropic--claude-4-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -95128,33 +100311,36 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-vision-instruct", - "name": "Phi-3.5-vision instruct (128k)", - "display_name": "Phi-3.5-vision instruct (128k)", + "id": "anthropic--claude-4.5-sonnet", + "name": "anthropic--claude-4.5-sonnet", + "display_name": "anthropic--claude-4.5-sonnet", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -95162,65 +100348,72 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 
}, "type": "chat" }, { - "id": "microsoft/phi-4-reasoning", - "name": "Phi-4-Reasoning", - "display_name": "Phi-4-Reasoning", + "id": "anthropic--claude-3.5-sonnet", + "name": "anthropic--claude-3.5-sonnet", + "display_name": "anthropic--claude-3.5-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04-30", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "microsoft/phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "anthropic--claude-4.6-opus", + "name": "anthropic--claude-4.6-opus", + "display_name": "anthropic--claude-4.6-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -95228,87 +100421,138 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-128k-instruct", - "name": "Phi-3-mini instruct (128k)", - "display_name": "Phi-3-mini instruct (128k)", 
+ "id": "gemini-2.5-flash-lite", + "name": "gemini-2.5-flash-lite", + "display_name": "gemini-2.5-flash-lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 }, "type": "chat" }, { - "id": "microsoft/phi-3-small-128k-instruct", - "name": "Phi-3-small instruct (128k)", - "display_name": "Phi-3-small instruct (128k)", + "id": "anthropic--claude-3.7-sonnet", + "name": "anthropic--claude-3.7-sonnet", + "display_name": "anthropic--claude-3.7-sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 
1024, + "unit": "tokens" + }, + "interleaved": false, + "summaries": false, + "visibility": "full", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic uses thinking budget tokens" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-10-31", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "microsoft/mai-ds-r1", - "name": "MAI-DS-R1", - "display_name": "MAI-DS-R1", + "id": "sonar", + "name": "sonar", + "display_name": "sonar", "modalities": { "input": [ "text" @@ -95318,230 +100562,282 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi-4-multimodal-instruct", - "display_name": "Phi-4-multimodal-instruct", + "id": "sonar-pro", + "name": "sonar-pro", + "display_name": "sonar-pro", "modalities": { "input": [ "text", - "image", - "audio" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + 
"release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "microsoft/phi-3-small-8k-instruct", - "name": "Phi-3-small instruct (8k)", - "display_name": "Phi-3-small instruct (8k)", + "id": "gpt-5.4", + "name": "gpt-5.4", + "display_name": "gpt-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "gpt-4.1", + "name": "gpt-4.1", + "display_name": "gpt-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - 
"last_updated": "2024-12-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-mini-instruct", - "name": "Phi-3.5-mini instruct (128k)", - "display_name": "Phi-3.5-mini instruct (128k)", + "id": "anthropic--claude-3-opus", + "name": "anthropic--claude-3-opus", + "display_name": "anthropic--claude-3-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 200000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "attachment": true, + "open_weights": false, + "knowledge": "2023-08-31", + "release_date": "2024-02-29", + "last_updated": "2024-02-29", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "microsoft/phi-3-mini-4k-instruct", - "name": "Phi-3-mini instruct (4k)", - "display_name": "Phi-3-mini instruct (4k)", + "id": "gpt-5-mini", + "name": "gpt-5-mini", + "display_name": "gpt-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + 
"effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "microsoft/phi-3-medium-4k-instruct", - "name": "Phi-3-medium instruct (4k)", - "display_name": "Phi-3-medium instruct (4k)", + "id": "gpt-4.1-mini", + "name": "gpt-4.1-mini", + "display_name": "gpt-4.1-mini", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "attachment": true, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "microsoft/phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE instruct (128k)", - "display_name": "Phi-3.5-MoE instruct (128k)", + "id": "sonar-deep-research", + "name": "sonar-deep-research", + "display_name": "sonar-deep-research", "modalities": { "input": [ "text" @@ -95552,73 +100848,99 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + 
"open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 8, + "reasoning": 3 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "gpt-5-nano", + "name": "gpt-5-nano", + "display_name": "gpt-5-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "anthropic--claude-4.5-opus", + "name": "anthropic--claude-4.5-opus", + "display_name": "anthropic--claude-4.5-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -95626,100 +100948,137 @@ "supported": true, "default": true }, - "attachment": 
false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "anthropic--claude-4.7-opus", + "name": "anthropic--claude-4.7-opus", + "display_name": "anthropic--claude-4.7-opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "meta/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "gpt-5.5", + "name": "gpt-5.5", + "display_name": "gpt-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - 
"last_updated": "2025-01-31", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" - }, + } + ] + }, + "opencode": { + "id": "opencode", + "name": "OpenCode Zen", + "display_name": "OpenCode Zen", + "api": "https://opencode.ai/zen/v1", + "doc": "https://opencode.ai/docs/zen", + "models": [ { - "id": "meta/llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "ring-2.6-1t-free", + "name": "Ring 2.6 1T Free", + "display_name": "Ring 2.6 1T Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -95727,11 +101086,22 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-06", + "release_date": "2026-05-08", + "last_updated": "2026-05-08", "cost": { "input": 0, "output": 0 @@ -95739,9 +101109,9 @@ "type": "chat" }, { - "id": "meta/meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "mimo-v2-pro-free", + 
"name": "MiMo V2 Pro Free", + "display_name": "MiMo V2 Pro Free", "modalities": { "input": [ "text" @@ -95751,8 +101121,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 1048576, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -95760,21 +101130,33 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "meta/meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -95784,8 +101166,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -95793,34 +101175,44 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": 
"Llama-3.2-11B-Vision-Instruct", + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -95828,21 +101220,33 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "meta/meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -95852,8 +101256,8 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -95861,32 +101265,47 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - 
"display_name": "Llama-3.3-70B-Instruct", + "id": "mimo-v2.5-free", + "name": "MiMo V2.5 Free", + "display_name": "MiMo V2.5 Free", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -95894,105 +101313,125 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-12", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - 
"text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "nemotron-3-ultra-free", + "name": "Nemotron 3 Ultra Free", + "display_name": "Nemotron 3 Ultra Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -96000,80 +101439,93 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-06-04", + "last_updated": "2026-06-04", "cost": { "input": 0, - "output": 0 + 
"output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "glm-4.7-free", + "name": "GLM-4.7 Free", + "display_name": "GLM-4.7 Free", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "OpenAI o4-mini", - "display_name": "OpenAI o4-mini", + "id": "gemini-3-flash", + "name": "Gemini 3 Flash", + "display_name": "Gemini 3 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -96082,31 +101534,37 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": 
false, + "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "OpenAI o3-mini", - "display_name": "OpenAI o3-mini", + "id": "deepseek-v4-flash-free", + "name": "DeepSeek V4 Flash Free", + "display_name": "DeepSeek V4 Flash Free", "modalities": { "input": [ "text" @@ -96117,10 +101575,10 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -96128,113 +101586,185 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": 
false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual 
thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/o1-mini", - "name": "OpenAI o1-mini", - "display_name": "OpenAI o1-mini", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -96246,6 +101776,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -96253,35 +101790,40 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" }, { - "id": "openai/o1-preview", - "name": "OpenAI o1-preview", - "display_name": "OpenAI o1-preview", + "id": "gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 
1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -96290,35 +101832,43 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0, - "output": 0 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" }, { - "id": "openai/o1", - "name": "OpenAI o1", - "display_name": "OpenAI o1", + "id": "minimax-m3-free", + "name": "MiniMax M3 Free", + "display_name": "MiniMax M3 Free", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -96326,129 +101876,163 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 32000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2024-09-12", - "last_updated": "2024-12-17", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-05-31", + "last_updated": "2026-05-31", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": 
"chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", + "id": "gemini-3-pro", + "name": "Gemini 3 Pro", + "display_name": "Gemini 3 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" - } - ] - }, - "xiaomi-token-plan-cn": { - "id": "xiaomi-token-plan-cn", - "name": "Xiaomi Token Plan (China)", - "display_name": "Xiaomi Token Plan (China)", - "api": "https://token-plan-cn.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "kimi-k2.5-free", + "name": "Kimi K2.5 Free", + "display_name": "Kimi K2.5 Free", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, - "tool_call": false, 
+ "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 204800, "output": 131072 }, "temperature": true, @@ -96468,82 +102052,106 @@ ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voicedesign", - "name": "MiMo-V2.5-TTS-VoiceDesign", - "display_name": "MiMo-V2.5-TTS-VoiceDesign", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 384000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + 
"supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0, - "output": 0 + "input": 1.74, + "output": 3.84, + "cache_read": 0.145 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voiceclone", - "name": "MiMo-V2.5-TTS-VoiceClone", - "display_name": "MiMo-V2.5-TTS-VoiceClone", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 2.2, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -96553,8 +102161,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -96574,153 +102182,218 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", 
"cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.4, + "output": 2.5, + "cache_read": 0.4 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75, + "tiers": [ + { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 6, + "output": 22.5, + "cache_read": 0.6, + "cache_write": 7.5 + } }, "type": "chat" }, { - "id": "mimo-v2.5-tts", - "name": "MiMo-V2.5-TTS", - "display_name": "MiMo-V2.5-TTS", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" - } - ] - }, - "lmstudio": { - "id": "lmstudio", - "name": "LMStudio", - "display_name": "LMStudio", - "api": "http://127.0.0.1:1234/v1", - "doc": "https://lmstudio.ai/models", - "models": [ - { - "id": "qwen/qwen3-coder-30b", - "name": "Qwen3 Coder 30B", - "display_name": "Qwen3 Coder 30B", + }, + { + "id": "qwen3-coder", + "name": "Qwen3 Coder", + "display_name": 
"Qwen3 Coder", "modalities": { "input": [ "text" @@ -96744,15 +102417,15 @@ "release_date": "2025-07-23", "last_updated": "2025-07-23", "cost": { - "input": 0, - "output": 0 + "input": 0.45, + "output": 1.8 }, "type": "chat" }, { - "id": "qwen/qwen3-30b-a3b-2507", - "name": "Qwen3 30B A3B 2507", - "display_name": "Qwen3 30B A3B 2507", + "id": "hy3-preview-free", + "name": "Hy3 preview Free", + "display_name": "Hy3 preview Free", "modalities": { "input": [ "text" @@ -96762,170 +102435,208 @@ ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "knowledge": "2025-06", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - 
"last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 }, "type": "chat" - } - ] - }, - "claudinio": { - "id": "claudinio", - "name": "Claudinio", - "display_name": "Claudinio", - "api": "https://api.claudin.io/v1", - "doc": "https://claudin.io", - "models": [ + }, { - "id": "claudinio", - "name": "Claudinio", - "display_name": "Claudinio", + "id": "gpt-5.3-codex-spark", + "name": "GPT-5.3 Codex Spark", + "display_name": "GPT-5.3 Codex Spark", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2026-05", - "release_date": "2026-05-12", - "last_updated": "2026-06-02", + "knowledge": "2025-08-31", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.15 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" - } - ] - }, - "alibaba-coding-plan": { - "id": "alibaba-coding-plan", - "name": "Alibaba Coding Plan", - "display_name": "Alibaba Coding Plan", - "api": "https://coding-intl.dashscope.aliyuncs.com/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": 
"MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "gpt-5.1-codex-max", + "name": "GPT-5.1 Codex Max", + "display_name": "GPT-5.1 Codex Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" @@ -96933,42 +102644,56 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], 
"interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "ling-2.6-flash-free", + "name": "Ling 2.6 Flash Free", + "display_name": "Ling 2.6 Flash Free", "modalities": { "input": [ "text" @@ -96978,8 +102703,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262100, + "output": 32800 }, "temperature": true, "tool_call": true, @@ -96988,32 +102713,32 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-06", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": 
true, @@ -97032,110 +102757,131 @@ ] } }, - "attachment": false, - "open_weights": true, + "attachment": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.2, + "output": 1.2, + "cache_read": 0.02, + "cache_write": 0.25 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "claude-3-5-haiku", + "name": "Claude Haiku 3.5", + "display_name": "Claude Haiku 3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-07-31", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + 
"medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -97144,44 +102890,51 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "minimax-m2.7", + "name": "MiniMax M2.7", + 
"display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -97200,21 +102953,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-04-27", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.1875, - "output": 1.125, - "cache_write": 0.234375 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "north-mini-code-free", + "name": "North Mini Code Free", + "display_name": "North Mini Code Free", "modalities": { "input": [ "text" @@ -97224,13 +102978,14 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -97244,22 +102999,20 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "open_weights": true, + "knowledge": "2025-09-23", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "grok-code", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ "text" @@ -97269,8 +103022,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -97278,21 +103031,10 @@ "supported": true, 
"default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-08-20", + "last_updated": "2025-08-20", "cost": { "input": 0, "output": 0, @@ -97302,172 +103044,128 @@ "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, - "type": "chat" - } - ] - }, - "modelscope": { - "id": "modelscope", - "name": "ModelScope", - "display_name": "ModelScope", - "api": "https://api-inference.modelscope.cn/v1", - "doc": "https://modelscope.cn/docs/model-service/API-Inference/intro", - "models": [ - { - "id": "ZhipuAI/GLM-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 98304 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "ZhipuAI/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 98304 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + 
"visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -97475,7 +103173,7 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -97494,168 +103192,175 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "knowledge": "2024-10", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "claude-fable-5", + "name": 
"Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", - "cost": { - "input": 0, - "output": 0 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 131072 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0, - "output": 0 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen3 30B A3B Thinking 2507", - "display_name": "Qwen3 30B A3B Thinking 2507", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" - } - ] - }, - "qihang-ai": { - "id": "qihang-ai", - "name": "QiHang", - "display_name": "QiHang", - "api": "https://api.qhaigc.net/v1", - "doc": "https://www.qhaigc.net/docs", - "models": [ + }, { - "id": "gpt-5-mini", - "name": "GPT-5-Mini", - "display_name": "GPT-5-Mini", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -97668,23 +103373,41 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.04, - "output": 0.29 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": 
"gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -97694,7 +103417,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -97725,88 +103448,70 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "minimax-m2.5-free", + "name": "MiniMax M2.5 Free", + "display_name": "MiniMax M2.5 Free", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.14, - "output": 0.71 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, "temperature": true, @@ -97818,51 +103523,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.07, - "output": 0.43, - "tiers": [ - { - "input": 0.07, - "output": 0.43, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 0.07, - "output": 0.43 + "continuation": [ + "thinking_blocks" + ] } }, + "attachment": true, + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.95, + "output": 4, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", 
"modalities": { "input": [ "text", @@ -97874,8 +103558,8 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -97887,11 +103571,18 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -97899,41 +103590,39 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.43, - "output": 2.14 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "minimax-m2.1-free", + "name": "MiniMax M2.1 Free", + "display_name": "MiniMax M2.1 Free", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -97943,53 +103632,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 
24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.09, - "output": 0.71, - "tiers": [ - { - "input": 0.09, - "output": 0.71, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 0.09, - "output": 0.71 - } + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -98000,68 +103661,64 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ + "minimal", "low", "medium", "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.71, - "output": 3.57 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -98075,9 +103732,8 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "low", "medium", "high", "xhigh" @@ -98094,24 +103750,24 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.14, - "output": 1.14 + "input": 30, + "output": 180, + "cache_read": 30 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" @@ -98119,55 +103775,59 @@ }, "limit": { "context": 1000000, - "output": 65000 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 
1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ "low", - "high" + "medium", + "high", + "max" ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.57, - "output": 3.43 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" - } - ] - }, - "poe": { - "id": "poe", - "name": "Poe", - "display_name": "Poe", - "api": "https://api.poe.com/v1", - "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", - "models": [ + }, { - "id": "empiriolabs/deepseek-v4-pro-el", - "name": "DeepSeek-V4-Pro-EL", - "display_name": "DeepSeek-V4-Pro-EL", + "id": "mimo-v2-flash-free", + "name": "MiMo V2 Flash Free", + "display_name": "MiMo V2 Flash Free", "modalities": { "input": [ "text" @@ -98177,144 +103837,237 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "knowledge": "2024-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 1.67, - "output": 
3.33 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "empiriolabs/deepseek-v4-flash-el", - "name": "DeepSeek-V4-Flash-EL", - "display_name": "DeepSeek-V4-Flash-EL", + "id": "gemini-3.1-pro", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048576, + "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-05-02", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.14, - "output": 0.28 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-v3", - "name": "ElevenLabs-v3", - "display_name": "ElevenLabs-v3", + "id": "trinity-large-preview-free", + "name": "Trinity Large Preview", + "display_name": "Trinity Large Preview", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-05", - 
"last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-01-28", + "last_updated": "2026-01-28", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-music", - "name": "ElevenLabs-Music", - "display_name": "ElevenLabs-Music", + "id": "big-pickle", + "name": "Big Pickle", + "display_name": "Big Pickle", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 2000, - "output": 8192 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-08-29", - "last_updated": "2025-08-29", + "knowledge": "2025-01", + "release_date": "2025-10-17", + "last_updated": "2025-10-17", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, "type": "chat" }, { - "id": "elevenlabs/elevenlabs-v2.5-turbo", - "name": "ElevenLabs-v2.5-Turbo", - "display_name": "ElevenLabs-v2.5-Turbo", + "id": "gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1050000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2024-10-28", - "last_updated": "2024-10-28", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + 
"last_updated": "2026-04-24", + "cost": { + "input": 30, + "output": 180, + "cache_read": 30 + }, "type": "chat" }, { - "id": "fireworks-ai/kimi-k2.5-fw", - "name": "Kimi-K2.5-FW", - "display_name": "Kimi-K2.5-FW", + "id": "qwen3.6-plus-free", + "name": "Qwen3.6 Plus Free", + "display_name": "Qwen3.6 Plus Free", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -98322,27 +104075,41 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "novita/glm-4.7-n", - "name": "glm-4.7-n", - "display_name": "glm-4.7-n", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -98352,68 +104119,102 @@ ] }, "limit": { - "context": 205000, + "context": 204800, "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1, + "output": 
3.2, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "novita/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "mimo-v2-omni-free", + "name": "MiMo V2 Omni Free", + "display_name": "MiMo V2 Omni Free", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "novita/kimi-k2-thinking", - "name": "kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -98424,37 +104225,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - 
"last_updated": "2025-11-07", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, "type": "chat" }, { - "id": "novita/deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -98462,24 +104281,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.13 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "novita/minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "glm-5-free", + "name": "GLM-5 Free", + "display_name": "GLM-5 Free", "modalities": { "input": [ "text" @@ -98489,10 +104325,10 @@ ] }, "limit": { - "context": 205000, + "context": 204800, "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -98500,19 +104336,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-26", - "last_updated": "2025-12-26", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "novita/kimi-k2.6", - "name": "Kimi-K2.6", - "display_name": "Kimi-K2.6", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", @@ -98525,7 +104373,7 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -98535,25 +104383,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2026-04-20", - "last_updated": "2026-05-02", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.96, - "output": 4.04, - "cache_read": 0.16 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, { - "id": "novita/glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "nemotron-3-super-free", + "name": "Nemotron 3 Super Free", + "display_name": "Nemotron 3 Super Free", "modalities": { "input": [ "text" @@ -98563,8 +104418,8 @@ ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 204800, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -98583,16 +104438,22 @@ ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": false, + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": 
"2026-03-11", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 + }, "type": "chat" }, { - "id": "novita/glm-4.6v", - "name": "glm-4.6v", - "display_name": "glm-4.6v", + "id": "grok-build-0.1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", "modalities": { "input": [ "text", @@ -98603,71 +104464,106 @@ ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2026-05-20", + "last_updated": "2026-05-20", + "cost": { + "input": 1, + "output": 2, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "novita/glm-4.7-flash", - "name": "glm-4.7-flash", - "display_name": "glm-4.7-flash", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 65500 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.07, + "output": 8.5, + "cache_read": 0.107 + }, "type": "chat" }, { - "id": "novita/glm-5", - "name": "GLM-5", - 
"display_name": "GLM-5", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -98676,609 +104572,494 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" - }, + } + ] + }, + "inference": { + "id": "inference", + "name": "Inference", + "display_name": "Inference", + "api": "https://inference.net/v1", + "doc": "https://inference.net/models", + "models": [ { - "id": "novita/kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "mistral/mistral-nemo-12b-instruct", + "name": "Mistral Nemo 12B Instruct", + "display_name": "Mistral Nemo 12B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 262144 + "context": 16000, + "output": 4096 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.038, + "output": 0.1 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude-Sonnet-4", - "display_name": "Claude-Sonnet-4", + "id": "google/gemma-3", + "name": "Google Gemma 3", + "display_name": "Google Gemma 3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 64000 + "context": 125000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.15, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude-Sonnet-4.6", - "display_name": "Claude-Sonnet-4.6", + "id": "osmosis/osmosis-structure-0.6b", + "name": "Osmosis Structure 0.6B", + "display_name": "Osmosis Structure 0.6B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 4000, + "output": 2048 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 0.1, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-embedding-4b", + "name": "Qwen 3 Embedding 4B", + "display_name": "Qwen 3 Embedding 4B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "limit": { + "context": 32000, + "output": 2048 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.01, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude-Opus-4.5", - "display_name": "Claude-Opus-4.5", + "id": "qwen/qwen-2.5-7b-vision-instruct", + "name": "Qwen 2.5 7B Vision Instruct", + "display_name": "Qwen 2.5 7B Vision Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 64000 + "context": 125000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking 
budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-21", - "last_updated": "2025-11-21", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude-Opus-4.7", - "display_name": "Claude-Opus-4.7", + "id": "meta/llama-3.1-8b-instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-15", - "last_updated": "2026-04-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.4 + "input": 0.025, + "output": 0.025 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-3", - "name": "Claude-Haiku-3", - "display_name": "Claude-Haiku-3", + "id": "meta/llama-3.2-1b-instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-03-09", - "last_updated": "2024-03-09", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.21, - "output": 1.1, - "cache_read": 0.021, - "cache_write": 0.26 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5", - "name": "Claude-Sonnet-3.5", - "display_name": "Claude-Sonnet-3.5", + "id": "meta/llama-3.2-11b-vision-instruct", + "name": "Llama 3.2 11B Vision Instruct", + "display_name": "Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-06-05", - "last_updated": "2024-06-05", + "open_weights": true, + "knowledge": 
"2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.055, + "output": 0.055 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.5-june", - "name": "Claude-Sonnet-3.5-June", - "display_name": "Claude-Sonnet-3.5-June", + "id": "meta/llama-3.2-3b-instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 189096, - "output": 8192 + "context": 16000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-11-18", - "last_updated": "2024-11-18", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.02, + "output": 0.02 }, "type": "chat" - }, + } + ] + }, + "inceptron": { + "id": "inceptron", + "name": "Inceptron", + "display_name": "Inceptron", + "api": "https://api.inceptron.io/v1", + "doc": "https://docs.inceptron.io", + "models": [ { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude-Sonnet-4.5", - "display_name": "Claude-Sonnet-4.5", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 32768 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": 
"tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.78, + "output": 3.5, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude-Opus-4.6", - "display_name": "Claude-Opus-4.6", + "id": "nvidia/llama-3.3-70b-instruct-fp8", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 983040, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 4.3, - "output": 21, - "cache_read": 0.43, - "cache_write": 5.3 + "input": 0.12, + "output": 0.38, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude-Haiku-4.5", - "display_name": "Claude-Haiku-4.5", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 192000, - "output": 64000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.85, - "output": 4.3, - "cache_read": 0.085, - "cache_write": 1.1 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-3.7", - "name": "Claude-Sonnet-3.7", - "display_name": "Claude-Sonnet-3.7", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -99286,243 +105067,176 @@ }, "limit": { "context": 196608, - "output": 128000 + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 2.6, - "output": 13, - "cache_read": 0.26, - "cache_write": 3.2 + "input": 0.24, + "output": 0.9, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "llama": { + "id": "llama", + "name": "Llama", + "display_name": "Llama", + "api": "https://api.llama.com/compat/v1/", + "doc": "https://llama.developer.meta.com/docs/models", + "models": [ { - "id": "anthropic/claude-haiku-3.5", - "name": "Claude-Haiku-3.5", - "display_name": "Claude-Haiku-3.5", + "id": "llama-4-scout-17b-16e-instruct-fp8", + "name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 189096, - 
"output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.68, - "output": 3.4, - "cache_read": 0.068, - "cache_write": 0.85 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude-Opus-4.1", - "display_name": "Claude-Opus-4.1", + "id": "cerebras-llama-4-maverick-17b-128e-instruct", + "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 32000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.8", - "name": "Claude-Opus-4.8", - "display_name": "Claude-Opus-4.8", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 4.2929, - "output": 21.4646 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude-Opus-4", - "display_name": "Claude-Opus-4", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 192512, - "output": 28672 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 13, - "output": 64, - "cache_read": 1.3, - "cache_write": 16 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok-4.20-Multi-Agent", - "display_name": "Grok-4.20-Multi-Agent", + "id": "cerebras-llama-4-scout-17b-16e-instruct", + "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -99530,56 +105244,60 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok-4.1-Fast-Non-Reasoning", - "display_name": "Grok-4.1-Fast-Non-Reasoning", + "id": "llama-3.3-8b-instruct", + "name": "Llama-3.3-8B-Instruct", + "display_name": "Llama-3.3-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + 
"last_updated": "2024-12-06", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "xai/grok-4-fast-non-reasoning", - "name": "Grok-4-Fast-Non-Reasoning", - "display_name": "Grok-4-Fast-Non-Reasoning", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ "text", @@ -99590,58 +105308,69 @@ ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "llmtr": { + "id": "llmtr", + "name": "LLMTR", + "display_name": "LLMTR", + "api": "https://llmtr.com/v1", + "doc": "https://llmtr.com/docs", + "models": [ { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok-4.1-Fast-Reasoning", - "display_name": "Grok-4.1-Fast-Reasoning", + "id": "sincap", + "name": "Sincap", + "display_name": "Sincap", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 128000, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "release_date": "2026-05-05", + "last_updated": "2026-05-05", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "xai/grok-3", - "name": "Grok 3", - 
"display_name": "Grok 3", + "id": "magibu-11b-v8", + "name": "Magibu 11B v8", + "display_name": "Magibu 11B v8", "modalities": { "input": [ "text" @@ -99651,140 +105380,126 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "release_date": "2026-06-05", + "last_updated": "2026-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "xai/grok-4-fast-reasoning", - "name": "Grok-4-Fast-Reasoning", - "display_name": "Grok-4-Fast-Reasoning", + "id": "gemma-4", + "name": "Gemma 4", + "display_name": "Gemma 4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-16", - "last_updated": "2025-09-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 5, + "output": 10 }, "type": "chat" }, { - "id": "xai/grok-3-mini", - "name": "Grok 3 Mini", - "display_name": "Grok 3 Mini", + "id": "medgemma-4b", + "name": "MedGemma 4B", + "display_name": "MedGemma 4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 8192, + "output": 4096 }, - "temperature": 
false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-04-11", - "last_updated": "2025-04-11", + "open_weights": true, + "release_date": "2026-04-26", + "last_updated": "2026-04-26", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 3, + "output": 5 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok-4", - "display_name": "Grok-4", + "id": "qwen3-6-35b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 16384, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, - "open_weights": false, - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "open_weights": true, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 5, + "output": 10 }, "type": "chat" }, { - "id": "xai/grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "trendyol-7b", + "name": "Trendyol 7B", + "display_name": "Trendyol 7B", "modalities": { "input": [ "text" @@ -99794,35 +105509,36 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-22", - "last_updated": 
"2025-08-22", + "attachment": false, + "open_weights": true, + "release_date": "2026-06-06", + "last_updated": "2026-06-06", "cost": { - "input": 0.2, - "output": 1.5, - "cache_read": 0.02 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "cohere": { + "id": "cohere", + "name": "Cohere", + "display_name": "Cohere", + "doc": "https://docs.cohere.com/docs/models", + "models": [ { - "id": "trytako/tako", - "name": "Tako", - "display_name": "Tako", + "id": "c4ai-aya-expanse-32b", + "name": "Aya Expanse 32B", + "display_name": "Aya Expanse 32B", "modalities": { "input": [ "text" @@ -99832,135 +105548,144 @@ ] }, "limit": { - "context": 2048, - "output": 8192 + "context": 128000, + "output": 4000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", "type": "chat" }, { - "id": "topazlabs-co/topazlabs", - "name": "TopazLabs", - "display_name": "TopazLabs", + "id": "command-a-03-2025", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 204, - "output": 8192 + "context": 256000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "runwayml/runway", - "name": "Runway", - "display_name": "Runway", + "id": "c4ai-aya-vision-32b", + "name": "Aya Vision 32B", + "display_name": "Aya 
Vision 32B", "modalities": { "input": [ "text", "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 16000, + "output": 4000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-11", - "last_updated": "2024-10-11", + "open_weights": true, + "release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, { - "id": "runwayml/runway-gen-4-turbo", - "name": "Runway-Gen-4-Turbo", - "display_name": "Runway-Gen-4-Turbo", + "id": "command-r7b-arabic-02-2025", + "name": "Command R7B Arabic", + "display_name": "Command R7B Arabic", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 256, - "output": 8192 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-09", - "last_updated": "2025-05-09", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "cost": { + "input": 0.0375, + "output": 0.15 + }, "type": "chat" }, { - "id": "stabilityai/stablediffusionxl", - "name": "StableDiffusionXL", - "display_name": "StableDiffusionXL", + "id": "c4ai-aya-vision-8b", + "name": "Aya Vision 8B", + "display_name": "Aya Vision 8B", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 200, - "output": 8192 + "context": 16000, + "output": 4000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2023-07-09", - "last_updated": "2023-07-09", + "open_weights": true, + 
"release_date": "2025-03-04", + "last_updated": "2025-05-14", "type": "chat" }, - { - "id": "poetools/claude-code", - "name": "claude-code", - "display_name": "claude-code", + { + "id": "command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -99970,297 +105695,318 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-27", - "last_updated": "2025-11-27", "type": "chat" }, { - "id": "google/imagen-4-ultra", - "name": "Imagen-4-Ultra", - "display_name": "Imagen-4-Ultra", + "id": "command-r7b-12-2024", + "name": "Command R7B", + "display_name": "Command R7B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", + "cost": { + "input": 0.0375, + "output": 0.15 + }, "type": "chat" }, { - "id": "google/nano-banana-pro", - "name": "Nano-Banana-Pro", - "display_name": "Nano-Banana-Pro", + "id": "command-a-vision-07-2025", + "name": "Command A Vision", + "display_name": "Command A Vision", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 8192 + 
"context": 128000, + "output": 8000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "google/imagen-3-fast", - "name": "Imagen-3-Fast", - "display_name": "Imagen-3-Fast", + "id": "command-a-plus-05-2026", + "name": "Command A Plus", + "display_name": "Command A Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 128000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2024-10-17", - "last_updated": "2024-10-17", + "open_weights": true, + "knowledge": "2025-04-01", + "release_date": "2026-05-20", + "last_updated": "2026-06-09", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "google/veo-3", - "name": "Veo-3", - "display_name": "Veo-3", + "id": "command-a-translate-08-2025", + "name": "Command A Translate", + "display_name": "Command A Translate", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 8000, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-21", - "last_updated": "2025-05-21", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": 
"2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "google/gemini-3-pro", - "name": "Gemini-3-Pro", - "display_name": "Gemini-3-Pro", + "id": "command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1.6, - "output": 9.6, - "cache_read": 0.16 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "google/veo-3.1-fast", - "name": "Veo-3.1-Fast", - "display_name": "Veo-3.1-Fast", + "id": "command-a-reasoning-08-2025", + "name": "Command A Reasoning", + "display_name": "Command A Reasoning", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 256000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", + "cost": { + "input": 2.5, + "output": 10 
}, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", "type": "chat" }, { - "id": "google/gemini-2.0-flash-lite", - "name": "Gemini-2.0-Flash-Lite", - "display_name": "Gemini-2.0-Flash-Lite", + "id": "north-mini-code-1-0", + "name": "North Mini Code", + "display_name": "North Mini Code", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 990000, - "output": 8192 + "context": 256000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-09-23", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.052, - "output": 0.21 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/imagen-4", - "name": "Imagen-4", - "display_name": "Imagen-4", + "id": "c4ai-aya-expanse-8b", + "name": "Aya Expanse 8B", + "display_name": "Aya Expanse 8B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 8000, + "output": 4000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-10-24", + "last_updated": "2024-10-24", "type": "chat" - }, + } + ] + }, + "sarvam": { + "id": "sarvam", + "name": "Sarvam AI", + 
"display_name": "Sarvam AI", + "api": "https://api.sarvam.ai/v1", + "doc": "https://docs.sarvam.ai/api-reference-docs/getting-started/models", + "models": [ { - "id": "google/gemini-3-flash", - "name": "Gemini-3-Flash", - "display_name": "Gemini-3-Flash", + "id": "sarvam-105b", + "name": "Sarvam-105B", + "display_name": "Sarvam-105B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100269,53 +106015,37 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2025-10-07", - "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 - }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini-2.5-Pro", - "display_name": "Gemini-2.5-Pro", + "id": "sarvam-30b", + "name": "Sarvam-30B", + "display_name": "Sarvam-30B", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 65536, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100324,208 +106054,238 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": 
"tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-18", + "last_updated": "2026-03-06", + "type": "chat" + } + ] + }, + "stepfun": { + "id": "stepfun", + "name": "StepFun", + "display_name": "StepFun", + "api": "https://api.stepfun.com/v1", + "doc": "https://platform.stepfun.com/docs/zh/overview/concept", + "models": [ + { + "id": "step-1-32k", + "name": "Step 1 (32K)", + "display_name": "Step 1 (32K)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, "open_weights": false, - "release_date": "2025-02-05", - "last_updated": "2025-02-05", + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 0.87, - "output": 7, - "cache_read": 0.087 + "input": 2.05, + "output": 9.59, + "cache_read": 0.41 }, "type": "chat" }, { - "id": "google/imagen-4-fast", - "name": "Imagen-4-Fast", - "display_name": "Imagen-4-Fast", + "id": "step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-25", - "last_updated": 
"2025-06-25", "type": "chat" }, { - "id": "google/nano-banana", - "name": "Nano-Banana", - "display_name": "Nano-Banana", + "id": "step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 256000, + "output": 256000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini-3.1-Flash-Lite", - "display_name": "Gemini-3.1-Flash-Lite", + "id": "step-2-16k", + "name": "Step 2 (16K)", + "display_name": "Step 2 (16K)", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-18", - "last_updated": "2026-02-18", + "knowledge": "2024-06", + "release_date": "2025-01-01", + "last_updated": "2026-02-13", "cost": { - "input": 0.25, - "output": 1.5 + "input": 5.21, + "output": 16.44, + "cache_read": 1.04 }, "type": "chat" - }, + } + ] + }, + "hpc-ai": { + "id": "hpc-ai", + "name": "HPC-AI", + "display_name": "HPC-AI", + "api": 
"https://api.hpc-ai.com/inference/v1", + "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", + "models": [ { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini-2.5-Flash-Lite", - "display_name": "Gemini-2.5-Flash-Lite", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "video", - "audio" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1024000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-06-19", - "last_updated": "2025-06-19", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01-01", + "release_date": "2026-01-01", + "last_updated": "2026-06-01", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.3, + "output": 1.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini-2.5-Flash", - "display_name": "Gemini-2.5-Flash", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1065535, - "output": 65535 + "context": 202000, + "output": 202000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100534,147 +106294,165 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - 
"max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-26", - "last_updated": "2025-04-26", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-08", + "last_updated": "2026-06-01", "cost": { - "input": 0.21, - "output": 1.8, - "cache_read": 0.021 + "input": 0.615, + "output": 2.46, + "cache_read": 0.133 }, "type": "chat" }, { - "id": "google/gemma-4-31b", - "name": "Gemma-4-31B", - "display_name": "Gemma-4-31B", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 1000000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-06-01", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" - }, + } + ] + }, + "minimax-cn": { + "id": "minimax-cn", + "name": "MiniMax (minimaxi.com)", + "display_name": "MiniMax (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/guides/quickstart", + "models": [ { - "id": "google/veo-2", - "name": "Veo-2", - "display_name": "Veo-2", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - 
"output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02", "type": "chat" }, { - "id": "google/gemini-2.0-flash", - "name": "Gemini-2.0-Flash", - "display_name": "Gemini-2.0-Flash", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 990000, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.1, - "output": 0.42 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro", - "name": "Gemini-3.1-Pro", - "display_name": "Gemini-3.1-Pro", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 204800, + "output": 131072 }, - "temperature": false, + 
"temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100683,50 +106461,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Gemini-3.5-Flash", - "display_name": "Gemini-3.5-Flash", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 196608, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100734,181 +106505,236 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 1.5152, - "output": 9.0909, - "cache_read": 0.1515 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": 
"google/veo-3.1", - "name": "Veo-3.1", - "display_name": "Veo-3.1", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-10-15", "type": "chat" }, { - "id": "google/lyria", - "name": "Lyria", - "display_name": "Lyria", + "id": "MiniMax-M3", + "name": "MiniMax-M3", + "display_name": "MiniMax-M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 512000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-06-04", - "last_updated": "2025-06-04", + "open_weights": true, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 + }, "type": "chat" }, { - "id": "google/gemini-deep-research", - "name": "gemini-deep-research", - "display_name": "gemini-deep-research", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ 
"text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.6, - "output": 9.6 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" - }, + } + ] + }, + "alibaba-coding-plan": { + "id": "alibaba-coding-plan", + "name": "Alibaba Coding Plan", + "display_name": "Alibaba Coding Plan", + "api": "https://coding-intl.dashscope.aliyuncs.com/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/coding-plan", + "models": [ { - "id": "google/veo-3-fast", - "name": "Veo-3-Fast", - "display_name": "Veo-3-Fast", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-13", - "last_updated": "2025-10-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, "type": "chat" }, { - "id": "google/imagen-3", - "name": "Imagen-3", - "display_name": "Imagen-3", + "id": "glm-4.7", + "name": "GLM-4.7", + 
"display_name": "GLM-4.7", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "attachment": true, - "open_weights": false, - "release_date": "2024-10-15", - "last_updated": "2024-10-15", "type": "chat" }, { - "id": "openai/chatgpt-4o-latest", - "name": "ChatGPT-4o-Latest", - "display_name": "ChatGPT-4o-Latest", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ "text", @@ -100919,42 +106745,50 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 4.5, - "output": 14 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5-Pro", - "display_name": "GPT-5-Pro", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ - "text", - 
"image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -100962,47 +106796,40 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 14, - "output": 110 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5-mini", - "display_name": "GPT-5-mini", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -101011,245 +106838,261 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-25", - "last_updated": "2025-06-25", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 0.22, - "output": 1.8, - 
"cache_read": 0.022 + "input": 0.1875, + "output": 1.125, + "cache_write": 0.234375 }, "type": "chat" }, { - "id": "openai/o3-mini-high", - "name": "o3-mini-high", - "display_name": "o3-mini-high", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", + "knowledge": "2025-04", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { - "input": 0.99, - "output": 4 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-image-1", - "name": "GPT-Image-1", - "display_name": "GPT-Image-1", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] 
+ } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-03-31", - "last_updated": "2025-03-31", - "type": "imageGeneration" + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 + }, + "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5-Chat", - "display_name": "GPT-5-Chat", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 196608, + "output": 24576 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "attachment": true, - "open_weights": false, - "release_date": "2024-05-13", - "last_updated": "2024-05-13", "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { 
"supported": true, @@ -101258,52 +107101,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 1.1, - "output": 9 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -101312,43 +107148,50 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "poe": { + "id": 
"poe", + "name": "Poe", + "display_name": "Poe", + "api": "https://api.poe.com/v1", + "doc": "https://creator.poe.com/docs/external-applications/openai-compatible-api", + "models": [ { - "id": "openai/sora-2-pro", - "name": "Sora-2-Pro", - "display_name": "Sora-2-Pro", + "id": "trytako/tako", + "name": "Tako", + "display_name": "Tako", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 2048, "output": 8192 }, "temperature": false, @@ -101358,25 +107201,24 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "xai/grok-code-fast-1", + "name": "Grok Code Fast 1", + "display_name": "Grok Code Fast 1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 256000, "output": 128000 }, "temperature": false, @@ -101387,40 +107229,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-08-22", + "last_updated": "2025-08-22", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-4-classic", - "name": "GPT-4-Classic", - "display_name": "GPT-4-Classic", + "id": "xai/grok-4.1-fast-reasoning", + "name": "Grok-4.1-Fast-Reasoning", + "display_name": "Grok-4.1-Fast-Reasoning", "modalities": { 
"input": [ "text", @@ -101431,121 +107257,97 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 2000000, + "output": 30000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2024-03-25", - "last_updated": "2024-03-25", - "cost": { - "input": 27, - "output": 54 - }, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "openai/gpt-image-1-mini", - "name": "GPT-Image-1-Mini", - "display_name": "GPT-Image-1-Mini", + "id": "xai/grok-3-mini", + "name": "Grok 3 Mini", + "display_name": "Grok 3 Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 131072, "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "imageGeneration" + "release_date": "2025-04-11", + "last_updated": "2025-04-11", + "cost": { + "input": 0.3, + "output": 0.5, + "cache_read": 0.075 + }, + "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4-Pro", - "display_name": "GPT-5.4-Pro", + "id": "xai/grok-4.1-fast-non-reasoning", + "name": "Grok-4.1-Fast-Non-Reasoning", + "display_name": "Grok-4.1-Fast-Non-Reasoning", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 2000000, + "output": 30000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": 
[ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-05", - "cost": { - "input": 27, - "output": 160 - }, + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1-mini", - "display_name": "GPT-4.1-mini", + "id": "xai/grok-3", + "name": "Grok 3", + "display_name": "Grok 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -101554,19 +107356,19 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-04-11", + "last_updated": "2025-04-11", "cost": { - "input": 0.36, - "output": 1.4, - "cache_read": 0.09 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2-Pro", - "display_name": "GPT-5.2-Pro", + "id": "xai/grok-4-fast-reasoning", + "name": "Grok-4-Fast-Reasoning", + "display_name": "Grok-4-Fast-Reasoning", "modalities": { "input": [ "text", @@ -101577,7 +107379,7 @@ ] }, "limit": { - "context": 400000, + "context": 2000000, "output": 128000 }, "temperature": false, @@ -101588,38 +107390,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 19, - "output": 150 + "input": 0.2, + 
"output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "xai/grok-4", + "name": "Grok-4", + "display_name": "Grok-4", "modalities": { "input": [ "text", @@ -101630,8 +107418,8 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -101641,32 +107429,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 18, - "output": 72 + "input": 3, + "output": 15, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "xai/grok-4-fast-non-reasoning", + "name": "Grok-4-Fast-Non-Reasoning", + "display_name": "Grok-4-Fast-Non-Reasoning", "modalities": { "input": [ "text", @@ -101677,159 +107457,101 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 2000000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-09-16", + "last_updated": "2025-09-16", "cost": { - "input": 0.99, - "output": 4, - "cache_read": 0.25 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": 
"openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "xai/grok-4.20-multi-agent", + "name": "Grok-4.20-Multi-Agent", + "display_name": "Grok-4.20-Multi-Agent", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 2.2, - "output": 14, - "cache_read": 0.22 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "topazlabs-co/topazlabs", + "name": "TopazLabs", + "display_name": "TopazLabs", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-01-31", - "last_updated": "2025-01-31", - "cost": { - "input": 0.99, - "output": 4 - }, + "release_date": 
"2024-12-03", + "last_updated": "2024-12-03", "type": "chat" }, { - "id": "openai/dall-e-3", - "name": "DALL-E-3", - "display_name": "DALL-E-3", + "id": "fireworks-ai/kimi-k2.5-fw", + "name": "Kimi-K2.5-FW", + "display_name": "Kimi-K2.5-FW", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 800, - "output": 8192 + "context": 262144, + "output": 16384 }, "temperature": false, "tool_call": true, @@ -101838,81 +107560,56 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-11-06", - "last_updated": "2023-11-06", - "type": "imageGeneration" + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + "cost": { + "input": 0, + "output": 0 + }, + "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "google/veo-3.1-fast", + "name": "Veo-3.1-Fast", + "display_name": "Veo-3.1-Fast", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", - "cost": { - "input": 4.5455, - "output": 27.2727, - "cache_read": 0.4545 - }, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": "openai/gpt-4o-mini-search", - "name": "GPT-4o-mini-Search", - "display_name": "GPT-4o-mini-Search", + "id": "google/imagen-3", + "name": 
"Imagen-3", + "display_name": "Imagen-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 480, "output": 8192 }, "temperature": false, @@ -101922,173 +107619,127 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", - "cost": { - "input": 0.14, - "output": 0.54 - }, + "release_date": "2024-10-15", + "last_updated": "2024-10-15", "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "google/nano-banana-pro", + "name": "Nano-Banana-Pro", + "display_name": "Nano-Banana-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5-nano", - "display_name": "GPT-5-nano", + "id": "google/lyria", + "name": "Lyria", + "display_name": "Lyria", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.045, - "output": 0.36, - "cache_read": 0.0045 - }, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "type": "chat" }, { - "id": "openai/gpt-4o-aug", - "name": "GPT-4o-Aug", - "display_name": "GPT-4o-Aug", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini-3.1-Flash-Lite", + "display_name": "Gemini-3.1-Flash-Lite", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "release_date": "2024-11-21", - "last_updated": "2024-11-21", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { - "input": 2.2, - "output": 9, - "cache_read": 1.1 + "input": 0.25, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o-mini", - "display_name": "GPT-4o-mini", + "id": "google/nano-banana", + "name": "Nano-Banana", + "display_name": "Nano-Banana", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 124096, - "output": 4096 + "context": 65536, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -102097,140 +107748,94 @@ }, "attachment": true, "open_weights": false, - "release_date": 
"2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.14, - "output": 0.54, - "cache_read": 0.068 + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "display_name": "GPT-5.1-Codex-Max", + "id": "google/gemini-deep-research", + "name": "gemini-deep-research", + "display_name": "gemini-deep-research", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 1.6, + "output": 9.6 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "google/veo-3", + "name": "Veo-3", + "display_name": "Veo-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", 
- "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", - "cost": { - "input": 0.22, - "output": 1.8, - "cache_read": 0.022 - }, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "type": "chat" }, { - "id": "openai/o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "google/gemini-3-flash", + "name": "Gemini-3-Flash", + "display_name": "Gemini-3-Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, @@ -102242,40 +107847,46 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "release_date": "2025-10-07", + "last_updated": "2025-10-07", "cost": { - "input": 140, - "output": 540 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "openai/gpt-4o-search", - "name": "GPT-4o-Search", - "display_name": "GPT-4o-Search", + "id": "google/imagen-3-fast", + "name": "Imagen-3-Fast", + "display_name": "Imagen-3-Fast", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 480, "output": 8192 }, "temperature": false, @@ -102285,29 +107896,28 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-03-11", - "last_updated": "2025-03-11", - 
"cost": { - "input": 2.2, - "output": 9 - }, + "release_date": "2024-10-17", + "last_updated": "2024-10-17", "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "google/gemini-2.5-pro", + "name": "Gemini-2.5-Pro", + "display_name": "Gemini-2.5-Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1065535, + "output": 65535 }, "temperature": false, "tool_call": true, @@ -102319,43 +107929,47 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 9, - "output": 36, - "cache_read": 2.2 + "input": 0.87, + "output": 7, + "cache_read": 0.087 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-raw", - "name": "GPT-3.5-Turbo-Raw", - "display_name": "GPT-3.5-Turbo-Raw", + "id": "google/veo-3.1", + "name": "Veo-3.1", + "display_name": "Veo-3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 4524, - "output": 2048 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -102364,119 +107978,110 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-27", - "last_updated": "2023-09-27", - "cost": { - "input": 0.45, - "output": 1.4 - }, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "type": "chat" }, { - "id": 
"openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "google/gemini-2.5-flash", + "name": "Gemini-2.5-Flash", + "display_name": "Gemini-2.5-Flash", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1065535, + "output": 65535 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-04-26", + "last_updated": "2025-04-26", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 0.21, + "output": 1.8, + "cache_read": 0.021 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4-Nano", - "display_name": "GPT-5.4-Nano", + "id": "google/imagen-4-fast", + "name": "Imagen-4-Fast", + "display_name": "Imagen-4-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - 
"release_date": "2026-03-11", - "last_updated": "2026-03-11", - "cost": { - "input": 0.18, - "output": 1.1, - "cache_read": 0.018 - }, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "google/gemini-3.5-flash", + "name": "Gemini-3.5-Flash", + "display_name": "Gemini-3.5-Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, @@ -102488,81 +108093,59 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ + "mode": "level", + "level": "high", + "level_options": [ + "minimal", "low", "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-10", - "last_updated": "2026-02-10", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 1.5152, + "output": 9.0909, + "cache_read": 0.1515 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex-spark", - "name": "GPT-5.3-Codex-Spark", - "display_name": "GPT-5.3-Codex-Spark", + "id": "google/gemma-4-31b", + "name": "Gemma-4-31B", + "display_name": "Gemma-4-31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { "input": 0, "output": 0 @@ -102570,21 +108153,20 @@ "type": "chat" }, { - "id": "openai/gpt-5.3-instant", - "name": "GPT-5.3-Instant", - "display_name": "GPT-5.3-Instant", + "id": "google/veo-3-fast", + "name": "Veo-3-Fast", + "display_name": "Veo-3-Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -102593,32 +108175,28 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", - "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 - }, + "release_date": "2025-10-13", + "last_updated": "2025-10-13", "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT-5.5-Pro", - "display_name": "GPT-5.5-Pro", + "id": "google/gemini-3-pro", + "name": "Gemini-3-Pro", + "display_name": "Gemini-3-Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, @@ -102628,115 +108206,135 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, 
"attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "release_date": "2025-10-22", + "last_updated": "2025-10-22", "cost": { - "input": 27.2727, - "output": 163.6364 + "input": 1.6, + "output": 9.6, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "google/gemini-2.0-flash", + "name": "Gemini-2.0-Flash", + "display_name": "Gemini-2.0-Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 990000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.8, - "output": 7.2, - "cache_read": 0.45 + "input": 0.1, + "output": 0.42 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-Turbo", - "display_name": "GPT-3.5-Turbo", + "id": "google/gemini-2.5-flash-lite", + "name": "Gemini-2.5-Flash-Lite", + "display_name": "Gemini-2.5-Flash-Lite", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 2048 + "context": 1024000, + "output": 64000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": 
false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "release_date": "2025-06-19", + "last_updated": "2025-06-19", "cost": { - "input": 0.45, - "output": 1.4 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "openai/gpt-4-classic-0314", - "name": "GPT-4-Classic-0314", - "display_name": "GPT-4-Classic-0314", + "id": "google/imagen-4", + "name": "Imagen-4", + "display_name": "Imagen-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -102745,30 +108343,25 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-08-26", - "last_updated": "2024-08-26", - "cost": { - "input": 27, - "output": 54 - }, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5-Turbo-Instruct", - "display_name": "GPT-3.5-Turbo-Instruct", + "id": "google/imagen-4-ultra", + "name": "Imagen-4-Ultra", + "display_name": "Imagen-4-Ultra", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 3500, - "output": 1024 + "context": 480, + "output": 8192 }, "temperature": false, "tool_call": true, @@ -102777,84 +108370,77 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-20", - "last_updated": "2023-09-20", - "cost": { - "input": 1.4, - "output": 1.8 - }, + "release_date": "2025-05-24", + "last_updated": "2025-05-24", "type": "chat" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1-Instant", - "display_name": "GPT-5.1-Instant", + "id": 
"google/gemini-3.1-pro", + "name": "Gemini-3.1-Pro", + "display_name": "Gemini-3.1-Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 65536 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ "low", - "medium", "high" ], - "visibility": "hidden" + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai/sora-2", - "name": "Sora-2", - "display_name": "Sora-2", + "id": "google/veo-2", + "name": "Veo-2", + "display_name": "Veo-2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "video" ] }, "limit": { - "context": 8192, + "context": 480, "output": 8192 }, "temperature": false, @@ -102864,157 +108450,129 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2024-12-02", + "last_updated": "2024-12-02", "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "google/gemini-2.0-flash-lite", + "name": "Gemini-2.0-Flash-Lite", + "display_name": "Gemini-2.0-Flash-Lite", "modalities": { "input": [ "text", - "image" + "image", + 
"video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 990000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 1.6, - "output": 13, - "cache_read": 0.16 + "input": 0.052, + "output": 0.21 }, "type": "chat" }, { - "id": "openai/gpt-image-2", - "name": "GPT-Image-2", - "display_name": "GPT-Image-2", + "id": "elevenlabs/elevenlabs-music", + "name": "ElevenLabs-Music", + "display_name": "ElevenLabs-Music", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "audio" ] }, "limit": { - "context": 8192, + "context": 2000, "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 5.0505, - "output": 32.3232, - "cache_read": 1.2626 - }, - "type": "imageGeneration" + "release_date": "2025-08-29", + "last_updated": "2025-08-29", + "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "elevenlabs/elevenlabs-v2.5-turbo", + "name": "ElevenLabs-v2.5-Turbo", + "display_name": "ElevenLabs-v2.5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 400000, - "output": 128000 + 
"context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-11-12", - "last_updated": "2025-11-12", - "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "release_date": "2024-10-28", + "last_updated": "2024-10-28", + "type": "chat" + }, + { + "id": "elevenlabs/elevenlabs-v3", + "name": "ElevenLabs-v3", + "display_name": "ElevenLabs-v3", + "modalities": { + "input": [ + "text" + ], + "output": [ + "audio" + ] + }, + "limit": { + "context": 128000, + "output": 8192 }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT-5.4-Mini", - "display_name": "GPT-5.4-Mini", + "id": "openai/chatgpt-4o-latest", + "name": "ChatGPT-4o-Latest", + "display_name": "ChatGPT-4o-Latest", "modalities": { "input": [ "text", @@ -103025,52 +108583,28 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, 
"attachment": true, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-03-12", + "release_date": "2024-08-14", + "last_updated": "2024-08-14", "cost": { - "input": 0.68, - "output": 4, - "cache_read": 0.068 + "input": 4.5, + "output": 14 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4-Turbo", - "display_name": "GPT-4-Turbo", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "GPT-3.5-Turbo-Instruct", + "display_name": "GPT-3.5-Turbo-Instruct", "modalities": { "input": [ "text", @@ -103081,8 +108615,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 3500, + "output": 1024 }, "temperature": false, "tool_call": true, @@ -103091,18 +108625,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2023-09-13", - "last_updated": "2023-09-13", + "release_date": "2023-09-20", + "last_updated": "2023-09-20", "cost": { - "input": 9, - "output": 27 + "input": 1.4, + "output": 1.8 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "openai/o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", @@ -103138,72 +108672,12 @@ }, "attachment": true, "open_weights": false, - "release_date": "2024-12-18", - "last_updated": "2024-12-18", - "cost": { - "input": 14, - "output": 54 - }, - "type": "chat" - }, - { - "id": "openai/gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", - "type": "imageGeneration" - }, - { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1-nano", - "display_name": "GPT-4.1-nano", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - 
"text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": false, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-15", - "last_updated": "2025-04-15", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.09, - "output": 0.36, - "cache_read": 0.022 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, @@ -103264,9 +108738,9 @@ "type": "chat" }, { - "id": "cerebras/gpt-oss-120b-cs", - "name": "GPT-OSS-120B-CS", - "display_name": "GPT-OSS-120B-CS", + "id": "openai/gpt-4o-search", + "name": "GPT-4o-Search", + "display_name": "GPT-4o-Search", "modalities": { "input": [ "text" @@ -103282,61 +108756,87 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 0.35, - "output": 0.75 + "input": 2.2, + "output": 9 }, "type": "chat" }, { - "id": "cerebras/llama-3.3-70b-cs", - "name": "llama-3.3-70b-cs", - "display_name": "llama-3.3-70b-cs", + "id": "openai/gpt-5.2-pro", + "name": "GPT-5.2-Pro", + "display_name": "GPT-5.2-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, 
"attachment": true, "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 19, + "output": 150 + }, "type": "chat" }, { - "id": "cerebras/llama-3.1-8b-cs", - "name": "Llama-3.1-8B-CS", - "display_name": "Llama-3.1-8B-CS", + "id": "openai/gpt-4-classic-0314", + "name": "GPT-4-Classic-0314", + "display_name": "GPT-4-Classic-0314", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8192, + "output": 4096 }, "temperature": false, "tool_call": true, @@ -103345,29 +108845,30 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-05-13", - "last_updated": "2025-05-13", + "release_date": "2024-08-26", + "last_updated": "2024-08-26", "cost": { - "input": 0.1, - "output": 0.1 + "input": 27, + "output": 54 }, "type": "chat" }, { - "id": "cerebras/qwen3-235b-2507-cs", - "name": "qwen3-235b-2507-cs", - "display_name": "qwen3-235b-2507-cs", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -103375,55 +108876,87 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + }, "type": "chat" }, 
{ - "id": "cerebras/qwen3-32b-cs", - "name": "qwen3-32b-cs", - "display_name": "qwen3-32b-cs", + "id": "openai/gpt-5-chat", + "name": "GPT-5-Chat", + "display_name": "GPT-5-Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-05-15", - "last_updated": "2025-05-15", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + }, "type": "chat" }, { - "id": "ideogramai/ideogram-v2a", - "name": "Ideogram-v2a", - "display_name": "Ideogram-v2a", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5-Turbo", + "display_name": "GPT-3.5-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 16384, + "output": 2048 }, "temperature": false, "tool_call": true, @@ -103432,52 +108965,77 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2023-09-13", + "last_updated": "2023-09-13", + "cost": { + "input": 0.45, + "output": 1.4 + }, "type": "chat" }, { - "id": "ideogramai/ideogram", - "name": "Ideogram", - "display_name": "Ideogram", + "id": "openai/gpt-5-pro", + "name": "GPT-5-Pro", + "display_name": "GPT-5-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "fixed", + "effort": 
"high", + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-04-03", - "last_updated": "2024-04-03", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", + "cost": { + "input": 14, + "output": 110 + }, "type": "chat" }, { - "id": "ideogramai/ideogram-v2a-turbo", - "name": "Ideogram-v2a-Turbo", - "display_name": "Ideogram-v2a-Turbo", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, + "context": 128000, "output": 8192 }, "temperature": false, @@ -103487,42 +109045,62 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-27", - "last_updated": "2025-02-27", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "type": "chat" }, { - "id": "ideogramai/ideogram-v2", - "name": "Ideogram-v2", - "display_name": "Ideogram-v2", + "id": "openai/o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 150, - "output": 8192 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "release_date": "2024-08-21", - "last_updated": "2024-08-21", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 0.99, + "output": 4, + "cache_read": 0.25 + }, "type": "chat" }, { - "id": "lumalabs/ray2", - "name": "Ray2", - "display_name": "Ray2", + "id": "openai/sora-2", + 
"name": "Sora-2", + "display_name": "Sora-2", "modalities": { "input": [ "text", @@ -103533,7 +109111,7 @@ ] }, "limit": { - "context": 5000, + "context": 8192, "output": 8192 }, "temperature": false, @@ -103543,23 +109121,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-02-20", - "last_updated": "2025-02-20", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "type": "chat" - } - ] - }, - "umans-ai-coding-plan": { - "id": "umans-ai-coding-plan", - "name": "Umans AI Coding Plan", - "display_name": "Umans AI Coding Plan", - "api": "https://api.code.umans.ai/v1", - "doc": "https://app.umans.ai/offers/code/docs", - "models": [ + }, { - "id": "umans-kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/o3-pro", + "name": "o3-pro", + "display_name": "o3-pro", "modalities": { "input": [ "text", @@ -103570,8 +109139,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -103582,76 +109151,63 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 18, + "output": 72 }, "type": "chat" }, { - "id": "umans-glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "openai/gpt-4-classic", + "name": "GPT-4-Classic", + "display_name": "GPT-4-Classic", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, 
"limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 4096 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "release_date": "2024-03-25", + "last_updated": "2024-03-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 27, + "output": 54 }, "type": "chat" }, { - "id": "umans-qwen3.6-35b-a3b", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "openai/gpt-4o-aug", + "name": "GPT-4o-Aug", + "display_name": "GPT-4o-Aug", "modalities": { "input": [ "text", @@ -103662,31 +109218,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "open_weights": false, + "release_date": "2024-11-21", + "last_updated": "2024-11-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 2.2, + "output": 9, + "cache_read": 1.1 }, "type": "chat" }, { - "id": "umans-coder", - "name": "Umans Coder", - "display_name": "Umans Coder", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4-Nano", + "display_name": "GPT-5.4-Nano", "modalities": { "input": [ "text", @@ -103697,87 +109251,80 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - 
"default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.18, + "output": 1.1, + "cache_read": 0.018 }, "type": "chat" }, { - "id": "umans-flash", - "name": "Umans Flash", - "display_name": "Umans Flash", + "id": "openai/sora-2-pro", + "name": "Sora-2-Pro", + "display_name": "Sora-2-Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "open_weights": false, + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "type": "chat" - } - ] - }, - "firepass": { - "id": "firepass", - "name": "Fireworks (Firepass)", - "display_name": "Fireworks (Firepass)", - "api": "https://api.fireworks.ai/inference/v1/", - "doc": "https://docs.fireworks.ai/firepass", - "models": [ + }, { - "id": "accounts/fireworks/routers/kimi-k2p6-turbo", - "name": "Kimi K2.6 Turbo", - "display_name": "Kimi K2.6 Turbo", + "id": "openai/gpt-5.1-codex", 
+ "name": "GPT-5.1-Codex", + "display_name": "GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -103788,94 +109335,84 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" - } - ] - }, - "gmicloud": { - "id": "gmicloud", - "name": "GMI Cloud", - "display_name": "GMI Cloud", - "api": "https://api.gmi-serving.com/v1", - "doc": "https://docs.gmicloud.ai/inference-engine/api-reference/llm-api-reference", - "models": [ + }, { - "id": "zai-org/GLM-5-FP8", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "openai/gpt-5.3-instant", + "name": "GPT-5.3-Instant", + "display_name": "GPT-5.3-Instant", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", 
- "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.6, - "output": 1.92, - "cache_read": 0.12 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/gpt-5.3-codex-spark", + "name": "GPT-5.3-Codex-Spark", + "display_name": "GPT-5.3-Codex-Spark", "modalities": { "input": [ "text" @@ -103885,10 +109422,10 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -103897,42 +109434,52 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-04", + "last_updated": "2026-03-04", "cost": { - "input": 0.98, - "output": 3.08, - "cache_read": 0.182 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT-5.1-Codex-Max", + "display_name": "GPT-5.1-Codex-Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - 
"context": 409600, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -103942,226 +109489,182 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "max" + "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "openai/dall-e-3", + "name": "DALL-E-3", + "display_name": "DALL-E-3", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 409600, - "output": 128000 + "context": 800, + "output": 8192 }, "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": 
"omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 4.5, - "output": 22.5, - "cache_read": 0.45 - }, - "type": "chat" + "release_date": "2023-11-06", + "last_updated": "2023-11-06", + "type": "imageGeneration" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/o3-mini", + "name": "o3-mini", + "display_name": "o3-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 409600, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 0.99, + "output": 4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.855, - "output": 3.6, - "cache_read": 0.144 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3-Codex", + "display_name": "GPT-5.3-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048575, - "output": 384000 + "context": 400000, + "output": 
128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104170,30 +109673,39 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-10", + "last_updated": "2026-02-10", "cost": { - "input": 0.112, - "output": 0.224, - "cache_read": 0.022 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT-5.1-Codex-Mini", + "display_name": "GPT-5.1-Codex-Mini", "modalities": { "input": [ "text" @@ -104203,51 +109715,51 @@ ] }, "limit": { - "context": 1048576, - "output": 384000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", 
- "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 1.392, - "output": 2.784, - "cache_read": 0.116 + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 }, "type": "chat" - } - ] - }, - "mixlayer": { - "id": "mixlayer", - "name": "Mixlayer", - "display_name": "Mixlayer", - "api": "https://models.mixlayer.ai/v1", - "doc": "https://docs.mixlayer.com", - "models": [ + }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "openai/o4-mini-deep-research", + "name": "o4-mini-deep-research", + "display_name": "o4-mini-deep-research", "modalities": { "input": [ "text" @@ -104257,10 +109769,10 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104269,170 +109781,139 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0.4, - "output": 3.2 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "qwen/qwen3.5-9b", - "name": "Qwen3.5 9B", - "display_name": "Qwen3.5 9B", + "id": "openai/gpt-image-1.5", + "name": "gpt-image-1.5", + "display_name": "gpt-image-1.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 262144 + 
"context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.1, - "output": 0.4 + "supported": false }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-12-16", + "last_updated": "2025-12-16", + "type": "imageGeneration" }, { - "id": "qwen/qwen3.5-35b-a3b", - "name": "Qwen3.5 35B A3B", - "display_name": "Qwen3.5 35B A3B", + "id": "openai/gpt-4.1-nano", + "name": "GPT-4.1-nano", + "display_name": "GPT-4.1-nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "context": 1047576, + "output": 32768 }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.25, - "output": 1.3 + "input": 0.09, + "output": 0.36, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "openai/gpt-3.5-turbo-raw", + "name": "GPT-3.5-Turbo-Raw", + "display_name": 
"GPT-3.5-Turbo-Raw", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 4524, + "output": 2048 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2023-09-27", + "last_updated": "2023-09-27", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.45, + "output": 1.4 }, "type": "chat" }, { - "id": "qwen/qwen3.5-27b", - "name": "Qwen3.5 27B", - "display_name": "Qwen3.5 27B", + "id": "openai/o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104441,50 +109922,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-18", + "last_updated": "2024-12-18", "cost": { - "input": 0.3, - "output": 2.4 + "input": 14, + "output": 54 }, "type": "chat" - } - ] - }, - "minimax-coding-plan": { - "id": 
"minimax-coding-plan", - "name": "MiniMax Coding Plan (minimax.io)", - "display_name": "MiniMax Coding Plan (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/coding-plan/intro", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "openai/o1-pro", + "name": "o1-pro", + "display_name": "o1-pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104492,150 +109968,178 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-03-19", + "last_updated": "2025-03-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 140, + "output": 540 }, "type": "chat" }, { - "id": "MiniMax-M3", - "name": "MiniMax-M3", - "display_name": "MiniMax-M3", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 512000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + 
"xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 2.2, + "output": 14, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4-Mini", + "display_name": "GPT-5.4-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-12", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.68, + "output": 4, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - 
"output": 131072 + "context": 1047576, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.8, + "output": 7.2, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "openai/o3-deep-research", + "name": "o3-deep-research", + "display_name": "o3-deep-research", "modalities": { "input": [ "text" @@ -104645,10 +110149,10 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104656,36 +110160,47 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-27", + "last_updated": "2025-06-27", "cost": { - "input": 0, - "output": 0 + "input": 9, + "output": 36, + "cache_read": 2.2 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "openai/gpt-5-mini", + "name": "GPT-5-mini", + "display_name": 
"GPT-5-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104694,213 +110209,229 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-25", + "last_updated": "2025-06-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.22, + "output": 1.8, + "cache_read": 0.022 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "openai/gpt-image-1", + "name": "GPT-Image-1", + "display_name": "GPT-Image-1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", - "cost": { - "input": 0, - "output": 0 + "supported": false }, - "type": "chat" - } - ] - }, - "evroc": { - "id": "evroc", - "name": "evroc", - "display_name": "evroc", - "api": 
"https://models.think.evroc.com/v1", - "doc": "https://docs.evroc.com/products/think/overview.html", - "models": [ + "attachment": true, + "open_weights": false, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", + "type": "imageGeneration" + }, { - "id": "mistralai/Voxtral-Small-24B-2507", - "name": "Voxtral Small 24B", - "display_name": "Voxtral Small 24B", + "id": "openai/gpt-4.1-mini", + "name": "GPT-4.1-mini", + "display_name": "GPT-4.1-mini", "modalities": { "input": [ - "audio", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1047576, + "output": 32768 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "attachment": true, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0.36, + "output": 1.4, + "cache_read": 0.09 }, "type": "chat" }, { - "id": "mistralai/devstral-small-2-24b-instruct-2512", - "name": "Devstral Small 2 24B Instruct 2512", - "display_name": "Devstral Small 2 24B Instruct 2512", + "id": "openai/gpt-4-turbo", + "name": "GPT-4-Turbo", + "display_name": "GPT-4-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 4096 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": true, + "open_weights": false, + "release_date": "2023-09-13", + "last_updated": "2023-09-13", "cost": { - "input": 0.12, - "output": 0.47 + "input": 9, + "output": 27 }, "type": "chat" }, { - "id": "mistralai/Magistral-Small-2509", - 
"name": "Magistral Small 1.2 24B", - "display_name": "Magistral Small 1.2 24B", + "id": "openai/gpt-image-1-mini", + "name": "GPT-Image-1-Mini", + "display_name": "GPT-Image-1-Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 8192, + "output": 8192 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", - "cost": { - "input": 0.59, - "output": 2.36 - }, - "type": "chat" + "attachment": true, + "open_weights": false, + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "type": "imageGeneration" }, { - "id": "KBLab/kb-whisper-large", - "name": "KB Whisper", - "display_name": "KB Whisper", + "id": "openai/gpt-5-nano", + "name": "GPT-5-nano", + "display_name": "GPT-5-nano", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 0.045, + "output": 0.36, + "cache_read": 0.0045 }, "type": "chat" }, { - "id": 
"moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/gpt-5.4-pro", + "name": "GPT-5.4-Pro", + "display_name": "GPT-5.4-Pro", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1050000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -104909,88 +110440,124 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 1.47, - "output": 5.9 + "input": 27, + "output": 160 }, "type": "chat" }, { - "id": "nvidia/Llama-3.3-70B-Instruct-FP8", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "openai/o3-mini-high", + "name": "o3-mini-high", + "display_name": "o3-mini-high", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 100000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", 
+ "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 1.18, - "output": 1.18 + "input": 0.99, + "output": 4 }, "type": "chat" }, { - "id": "intfloat/multilingual-e5-large-instruct", - "name": "E5 Multi-Lingual Large Embeddings 0.6B", - "display_name": "E5 Multi-Lingual Large Embeddings 0.6B", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5-Pro", + "display_name": "GPT-5.5-Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 512, - "output": 512 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.12, - "output": 0.12 + "input": 27.2727, + "output": 163.6364 }, "type": "chat" }, { - "id": "microsoft/Phi-4-multimodal-instruct", - "name": "Phi-4 15B", - "display_name": "Phi-4 15B", + "id": "openai/gpt-4o-mini", + "name": "GPT-4o-mini", + "display_name": "GPT-4o-mini", "modalities": { "input": [ "text", @@ -105001,27 +110568,29 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 124096, + "output": 4096 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.24, - 
"output": 0.47 + "input": 0.14, + "output": 0.54, + "cache_read": 0.068 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "openai/gpt-4o-mini-search", + "name": "GPT-4o-mini-Search", + "display_name": "GPT-4o-mini-Search", "modalities": { "input": [ "text" @@ -105031,178 +110600,295 @@ ] }, "limit": { - "context": 40960, - "output": 4096 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "attachment": true, + "open_weights": false, + "release_date": "2025-03-11", + "last_updated": "2025-03-11", "cost": { - "input": 0.12, - "output": 0.12 + "input": 0.14, + "output": 0.54 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507-FP8", - "name": "Qwen3 30B 2507", - "display_name": "Qwen3 30B 2507", + "id": "openai/gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 64000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 0.35, - "output": 
1.42 + "input": 1.1, + "output": 9 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen3 VL 30B", - "display_name": "Qwen3 VL 30B", + "id": "openai/gpt-5.2-codex", + "name": "GPT-5.2-Codex", + "display_name": "GPT-5.2-Codex", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 100000 + "context": 400000, + "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.24, - "output": 0.94 + "input": 1.6, + "output": 13, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "openai/gpt-5.1-instant", + "name": "GPT-5.1-Instant", + "display_name": "GPT-5.1-Instant", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 16384 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + 
"high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", "cost": { - "input": 0.24, - "output": 0.94 + "input": 1.1, + "output": 9, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper 3 Large", - "display_name": "Whisper 3 Large", + "id": "openai/gpt-image-2", + "name": "GPT-Image-2", + "display_name": "GPT-Image-2", "modalities": { "input": [ - "audio" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 448, - "output": 4096 + "context": 8192, + "output": 8192 }, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.00236, - "output": 0.00236, - "output_audio": 2.36 + "input": 5.0505, + "output": 32.3232, + "cache_read": 1.2626 }, - "type": "chat" - } - ] - }, - "nvidia": { - "id": "nvidia", - "name": "Nvidia", - "display_name": "Nvidia", - "api": "https://integrate.api.nvidia.com/v1", - "doc": "https://docs.api.nvidia.com/nim/", - "models": [ + "type": "imageGeneration" + }, { - "id": "z-ai/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + 
"mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-12", + "last_updated": "2025-11-12", + "cost": { + "input": 1.1, + "output": 9, + "cache_read": 0.11 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text", + "image" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -105211,90 +110897,96 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0, - "output": 0 + "input": 4.5455, + "output": 27.2727, + "cache_read": 0.4545 }, "type": "chat" }, { - "id": "upstage/solar-10_7b-instruct", - "name": "solar-10.7b-instruct", - "display_name": "solar-10.7b-instruct", + "id": "runwayml/runway", + "name": "Runway", + "display_name": "Runway", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, + "context": 256, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, 
"reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-05", - "last_updated": "2025-04-10", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "type": "chat" }, { - "id": "sarvamai/sarvam-m", - "name": "sarvam-m", - "display_name": "sarvam-m", + "id": "runwayml/runway-gen-4-turbo", + "name": "Runway-Gen-4-Turbo", + "display_name": "Runway-Gen-4-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, + "context": 256, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-09", + "last_updated": "2025-05-09", "type": "chat" }, { - "id": "mistralai/magistral-small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "cerebras/llama-3.1-8b-cs", + "name": "Llama-3.1-8B-CS", + "display_name": "Llama-3.1-8B-CS", "modalities": { "input": [ "text" @@ -105304,60 +110996,56 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 8192 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-05-13", + "last_updated": "2025-05-13", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mistralai/mistral-large-3-675b-instruct-2512", - "name": "Mistral Large 3 675B Instruct 2512", - "display_name": "Mistral Large 3 675B Instruct 2512", 
+ "id": "cerebras/qwen3-235b-2507-cs", + "name": "qwen3-235b-2507-cs", + "display_name": "qwen3-235b-2507-cs", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "type": "chat" }, { - "id": "mistralai/mistral-nemotron", - "name": "mistral-nemotron", - "display_name": "mistral-nemotron", + "id": "cerebras/gpt-oss-120b-cs", + "name": "GPT-OSS-120B-CS", + "display_name": "GPT-OSS-120B-CS", "modalities": { "input": [ "text" @@ -105370,25 +111058,26 @@ "context": 128000, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-06", + "last_updated": "2025-08-06", "cost": { - "input": 0, - "output": 0 + "input": 0.35, + "output": 0.75 }, "type": "chat" }, { - "id": "mistralai/mixtral-8x7b-instruct", - "name": "Mistral: Mixtral 8x7B Instruct", - "display_name": "Mistral: Mixtral 8x7B Instruct", + "id": "cerebras/llama-3.3-70b-cs", + "name": "llama-3.3-70b-cs", + "display_name": "llama-3.3-70b-cs", "modalities": { "input": [ "text" @@ -105398,28 +111087,24 @@ ] }, "limit": { - "context": 32768, - "output": 16384 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { 
"supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2023-12-10", - "last_updated": "2026-03-15", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-13", + "last_updated": "2025-05-13", "type": "chat" }, { - "id": "mistralai/mistral-7b-instruct-v03", - "name": "Mistral-7B-Instruct-v0.3", - "display_name": "Mistral-7B-Instruct-v0.3", + "id": "cerebras/qwen3-32b-cs", + "name": "qwen3-32b-cs", + "display_name": "qwen3-32b-cs", "modalities": { "input": [ "text" @@ -105429,580 +111114,827 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04-01", - "last_updated": "2025-04-01", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-15", + "last_updated": "2025-05-15", "type": "chat" }, { - "id": "mistralai/mixtral-8x22b-instruct", - "name": "Mistral: Mixtral 8x22B Instruct", - "display_name": "Mistral: Mixtral 8x22B Instruct", + "id": "anthropic/claude-sonnet-3.5", + "name": "Claude-Sonnet-3.5", + "display_name": "Claude-Sonnet-3.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 65536, - "output": 13108 + "context": 189096, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-04-17", - "last_updated": "2024-04-17", + "attachment": true, + "open_weights": false, + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, 
"type": "chat" }, { - "id": "mistralai/mistral-medium-3-instruct", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "anthropic/claude-sonnet-3.7", + "name": "Claude-Sonnet-3.7", + "display_name": "Claude-Sonnet-3.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 196608, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "mistralai/mistral-small-4-119b-2603", - "name": "mistral-small-4-119b-2603", - "display_name": "mistral-small-4-119b-2603", + "id": "anthropic/claude-sonnet-3.5-june", + "name": "Claude-Sonnet-3.5-June", + "display_name": "Claude-Sonnet-3.5-June", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 189096, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": false, + "release_date": "2024-11-18", + "last_updated": "2024-11-18", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "qwen/qwen2.5-coder-32b-instruct", - "name": "Qwen2.5 Coder 32b Instruct", - "display_name": "Qwen2.5 Coder 32b Instruct", + "id": "anthropic/claude-sonnet-4.5", + "name": "Claude-Sonnet-4.5", + "display_name": 
"Claude-Sonnet-4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 983040, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-06", - "last_updated": "2024-11-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2025-09-26", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "qwen/qwen3.5-122b-a10b", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "anthropic/claude-sonnet-4", + "name": "Claude-Sonnet-4", + "display_name": "Claude-Sonnet-4", "modalities": { "input": [ "text", "image", - "video", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 983040, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ 
"thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "qwen/qwen3-next-80b-a3b-instruct", - "name": "Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen3-Next-80B-A3B-Instruct", + "id": "anthropic/claude-haiku-4.5", + "name": "Claude-Haiku-4.5", + "display_name": "Claude-Haiku-4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 192000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 0.85, + "output": 4.3, + "cache_read": 0.085, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "qwen/qwen-image-edit", - "name": "Qwen Image Edit", - "display_name": "Qwen Image Edit", + "id": "anthropic/claude-haiku-3", + "name": "Claude-Haiku-3", + "display_name": "Claude-Haiku-3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 189096, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "release_date": "2024-03-09", + "last_updated": "2024-03-09", "cost": { - "input": 0, - "output": 0 + "input": 0.21, + "output": 1.1, + "cache_read": 0.021, + "cache_write": 0.26 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "anthropic/claude-opus-4.7", + "name": "Claude-Opus-4.7", + "display_name": "Claude-Opus-4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 1048576, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + 
"interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "release_date": "2026-04-15", + "last_updated": "2026-04-15", "cost": { - "input": 0, - "output": 0 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.4 }, "type": "chat" }, { - "id": "qwen/qwen-image", - "name": "Qwen Image", - "display_name": "Qwen Image", + "id": "anthropic/claude-haiku-3.5", + "name": "Claude-Haiku-3.5", + "display_name": "Claude-Haiku-3.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 189096, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-10-01", + "last_updated": "2024-10-01", "cost": { - "input": 0, - "output": 0 + "input": 0.68, + "output": 3.4, + "cache_read": 0.068, + "cache_write": 0.85 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "qwen/qwen3.5-397b-a17b", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "anthropic/claude-opus-4.8", + "name": "Claude-Opus-4.8", + "display_name": "Claude-Opus-4.8", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 1048576, + "output": 
128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0, - "output": 0 + "input": 4.2929, + "output": 21.4646 }, "type": "chat" }, { - "id": "black-forest-labs/flux_1-schnell", - "name": "FLUX.1-schnell", - "display_name": "FLUX.1-schnell", + "id": "anthropic/claude-opus-4.1", + "name": "Claude-Opus-4.1", + "display_name": "Claude-Opus-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 77, - "output": 8192 + "context": 196608, + "output": 32000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-08-01", - "last_updated": "2026-02-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + 
"interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, "type": "chat" }, { - "id": "black-forest-labs/flux_2-klein-4b", - "name": "FLUX.2 Klein 4B", - "display_name": "FLUX.2 Klein 4B", + "id": "anthropic/claude-opus-4.5", + "name": "Claude-Opus-4.5", + "display_name": "Claude-Opus-4.5", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 196608, + "output": 64000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-01-14", - "last_updated": "2026-01-31", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-21", + "last_updated": "2025-11-21", "cost": { - "input": 0, - "output": 0 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "black-forest-labs/flux_1-kontext-dev", - "name": "FLUX.1-Kontext-dev", - "display_name": "FLUX.1-Kontext-dev", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude-Sonnet-4.6", + "display_name": "Claude-Sonnet-4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 40960, - "output": 40960 + "context": 983040, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "open_weights": false, + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + "input": 2.6, + "output": 13, + "cache_read": 0.26, + "cache_write": 3.2 }, "type": "chat" }, { - "id": "black-forest-labs/flux.1-dev", - "name": "FLUX.1-dev", - "display_name": "FLUX.1-dev", + "id": "anthropic/claude-opus-4", + "name": "Claude-Opus-4", + "display_name": "Claude-Opus-4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 4096, - "output": 8192 + "context": 192512, + "output": 28672 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-01", - "last_updated": "2025-09-05", + "release_date": "2025-05-21", + "last_updated": "2025-05-21", "cost": { - "input": 0, - "output": 0 + "input": 13, + "output": 64, + "cache_read": 1.3, + "cache_write": 16 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "anthropic/claude-opus-4.6", + "name": "Claude-Opus-4.6", + "display_name": "Claude-Opus-4.6", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 983040, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2026-02-04", + "last_updated": "2026-02-04", "cost": { - "input": 0, - "output": 0 + "input": 4.3, + "output": 21, + "cache_read": 0.43, + "cache_write": 5.3 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "lumalabs/ray2", + "name": "Ray2", + "display_name": "Ray2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 5000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 0, - "output": 0 - }, + "attachment": true, + "open_weights": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "type": "chat" }, { - "id": "abacusai/dracarys-llama-3_1-70b-instruct", - "name": "dracarys-llama-3.1-70b-instruct", - "display_name": "dracarys-llama-3.1-70b-instruct", + "id": "poetools/claude-code", + "name": "claude-code", + "display_name": "claude-code", "modalities": { "input": [ "text" @@ -106012,28 +111944,25 @@ ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-11", - "last_updated": "2025-05-22", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-27", + "last_updated": "2025-11-27", "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-flash", - "name": 
"DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "empiriolabs/deepseek-v4-pro-el", + "name": "DeepSeek-V4-Pro-EL", + "display_name": "DeepSeek-V4-Pro-EL", "modalities": { "input": [ "text" @@ -106043,42 +111972,28 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 1000000, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "last_updated": "2026-05-02", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 1.67, + "output": 3.33 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "empiriolabs/deepseek-v4-flash-el", + "name": "DeepSeek-V4-Flash-EL", + "display_name": "DeepSeek-V4-Flash-EL", "modalities": { "input": [ "text" @@ -106088,204 +112003,166 @@ ] }, "limit": { - "context": 1048576, - "output": 393216 + "context": 1000000, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-05", "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "last_updated": "2026-05-02", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.14, + "output": 0.28 }, "type": "chat" }, { - "id": "nvidia/cosmos-predict1-5b", - "name": "cosmos-predict1-5b", - 
"display_name": "cosmos-predict1-5b", + "id": "stabilityai/stablediffusionxl", + "name": "StableDiffusionXL", + "display_name": "StableDiffusionXL", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ - "video" + "image" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200, + "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-03-18", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2023-07-09", + "last_updated": "2023-07-09", "type": "chat" }, { - "id": "nvidia/magpie-tts-zeroshot", - "name": "magpie-tts-zeroshot", - "display_name": "magpie-tts-zeroshot", + "id": "ideogramai/ideogram", + "name": "Ideogram", + "display_name": "Ideogram", "modalities": { "input": [ "text", - "audio" + "image" ], "output": [ - "audio" + "image" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 150, + "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-05-22", - "last_updated": "2025-06-12", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "type": "chat" }, { - "id": "nvidia/sparsedrive", - "name": "sparsedrive", - "display_name": "sparsedrive", + "id": "ideogramai/ideogram-v2a", + "name": "Ideogram-v2a", + "display_name": "Ideogram-v2a", "modalities": { "input": [ - "video" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 150, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": 
"2025-07-20", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "type": "chat" }, { - "id": "nvidia/streampetr", - "name": "streampetr", - "display_name": "streampetr", + "id": "ideogramai/ideogram-v2", + "name": "Ideogram-v2", + "display_name": "Ideogram-v2", "modalities": { "input": [ - "video" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, + "context": 150, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-11-13", - "last_updated": "2025-11-13", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2024-08-21", + "last_updated": "2024-08-21", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", - "name": "Nemotron 3 Nano Omni", - "display_name": "Nemotron 3 Nano Omni", + "id": "ideogramai/ideogram-v2a-turbo", + "name": "Ideogram-v2a-Turbo", + "display_name": "Ideogram-v2a-Turbo", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 150, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "nemotron-3-nano-30b-a3b", - "display_name": "nemotron-3-nano-30b-a3b", + "id": "novita/glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ "text" @@ 
-106295,7 +112172,7 @@ ] }, "limit": { - "context": 131072, + "context": 205000, "output": 131072 }, "temperature": true, @@ -106304,21 +112181,27 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-12", - "last_updated": "2024-12", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "nvidia/nv-embed-v1", - "name": "nv-embed-v1", - "display_name": "nv-embed-v1", + "id": "novita/minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ "text" @@ -106328,60 +112211,62 @@ ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 205000, + "output": 131072 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-06-07", - "last_updated": "2025-07-22", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-26", + "last_updated": "2025-12-26", "type": "chat" }, { - "id": "nvidia/llama-nemotron-rerank-vl-1b-v2", - "name": "llama-nemotron-rerank-vl-1b-v2", - "display_name": "llama-nemotron-rerank-vl-1b-v2", + "id": "novita/glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": 
false + "supported": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-31", - "last_updated": "2026-03-31", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "type": "chat" }, { - "id": "nvidia/studiovoice", - "name": "studiovoice", - "display_name": "studiovoice", + "id": "novita/kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -106391,28 +112276,36 @@ ] }, "limit": { - "context": 128000, + "context": 256000, "output": 8192 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-10-03", - "last_updated": "2025-06-13", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "type": "chat" }, { - "id": "nvidia/cosmos-transfer2_5-2b", - "name": "cosmos-transfer2.5-2b", - "display_name": "cosmos-transfer2.5-2b", + "id": "novita/kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ "text", @@ -106420,94 +112313,115 @@ "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "open_weights": false, + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-content-safety", - "name": "nemotron-3-content-safety", - "display_name": "nemotron-3-content-safety", + "id": "novita/glm-4.6v", + "name": "glm-4.6v", + "display_name": "glm-4.6v", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131000, + "output": 32768 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 0, - "output": 0 + "supported": true, + "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", "type": "chat" }, { - "id": "nvidia/usdvalidate", - "name": "usdvalidate", - "display_name": "usdvalidate", + "id": "novita/kimi-k2.6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": true, - "release_date": "2024-07-24", - "last_updated": "2025-01-08", + "knowledge": "2025-04", + "release_date": 
"2026-04-20", + "last_updated": "2026-05-02", "cost": { - "input": 0, - "output": 0 + "input": 0.96, + "output": 4.04, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "nvidia/llama-3_2-nemoretriever-300m-embed-v1", - "name": "llama-3_2-nemoretriever-300m-embed-v1", - "display_name": "llama-3_2-nemoretriever-300m-embed-v1", + "id": "novita/glm-4.7-flash", + "name": "glm-4.7-flash", + "display_name": "glm-4.7-flash", "modalities": { "input": [ "text" @@ -106517,60 +112431,58 @@ ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 200000, + "output": 65500 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-07-24", - "last_updated": "2025-07-24", - "cost": { - "input": 0, - "output": 0 + "extra_capabilities": { + "reasoning": { + "supported": true + } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "nvidia/llama-nemotron-embed-vl-1b-v2", - "name": "llama-nemotron-embed-vl-1b-v2", - "display_name": "llama-nemotron-embed-vl-1b-v2", + "id": "novita/glm-4.7-n", + "name": "glm-4.7-n", + "display_name": "glm-4.7-n", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 205000, + "output": 131072 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-10", - "last_updated": "2026-02-10", - "cost": { - "input": 0, - "output": 0 - }, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "type": "chat" }, { - "id": "nvidia/usdcode", - "name": "usdcode", - "display_name": "usdcode", + "id": "novita/glm-5", + "name": "GLM-5", + 
"display_name": "GLM-5", "modalities": { "input": [ "text" @@ -106580,28 +112492,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 205000, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "nvidia/llama-3_1-nemotron-safety-guard-8b-v3", - "name": "llama-3.1-nemotron-safety-guard-8b-v3", - "display_name": "llama-3.1-nemotron-safety-guard-8b-v3", + "id": "novita/deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -106612,27 +112537,43 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.4, + "cache_read": 0.13 }, "type": "chat" - }, + } + ] + }, + "kimi-for-coding": { + "id": "kimi-for-coding", + "name": "Kimi For Coding", + "display_name": "Kimi For Coding", + "api": "https://api.kimi.com/coding/v1", + "doc": 
"https://www.kimi.com/code/docs/en/third-party-tools/other-coding-agents.html", + "models": [ { - "id": "nvidia/rerank-qa-mistral-4b", - "name": "rerank-qa-mistral-4b", - "display_name": "rerank-qa-mistral-4b", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -106642,39 +112583,56 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 32768 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-03-17", - "last_updated": "2025-01-17", + "knowledge": "2025-07", + "release_date": "2025-11", + "last_updated": "2025-12", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-ultra-550b-a55b", - "name": "Nemotron 3 Ultra 550B A55B", - "display_name": "Nemotron 3 Ultra 550B A55B", + "id": "k2p5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -106684,30 +112642,34 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.5, - "output": 2.5, - "cache_read": 0.15 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "nvidia/nvidia-nemotron-nano-9b-v2", - "name": 
"nvidia-nemotron-nano-9b-v2", - "display_name": "nvidia-nemotron-nano-9b-v2", + "id": "k2p6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -106717,50 +112679,67 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-09", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "knowledge": "2025-01", + "release_date": "2026-04", + "last_updated": "2026-04", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "dinference": { + "id": "dinference", + "name": "DInference", + "display_name": "DInference", + "api": "https://api.dinference.com/v1", + "doc": "https://dinference.com", + "models": [ { - "id": "nvidia/synthetic-video-detector", - "name": "synthetic-video-detector", - "display_name": "synthetic-video-detector", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "nvidia/nv-embedcode-7b-v1", - "name": "nv-embedcode-7b-v1", - "display_name": "nv-embedcode-7b-v1", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", 
"modalities": { "input": [ "text" @@ -106770,61 +112749,84 @@ ] }, "limit": { - "context": 32768, - "output": 2048 + "context": 200000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-03-17", - "last_updated": "2025-05-29", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.45, + "output": 1.65 }, "type": "chat" }, { - "id": "nvidia/cosmos-transfer1-7b", - "name": "cosmos-transfer1-7b", - "display_name": "cosmos-transfer1-7b", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 200000, + "output": 128000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-06-13", - "last_updated": "2025-06-30", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 3.89 }, "type": "chat" }, { - "id": "nvidia/nemotron-mini-4b-instruct", - "name": "nemotron-mini-4b-instruct", - "display_name": "nemotron-mini-4b-instruct", + "id": "gpt-oss-120b", + "name": "GPT 
OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -106834,134 +112836,207 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "release_date": "2024-08-21", - "last_updated": "2024-08-26", + "release_date": "2025-08", + "last_updated": "2025-08", "cost": { - "input": 0, - "output": 0 + "input": 0.0675, + "output": 0.27 }, "type": "chat" }, { - "id": "nvidia/nemotron-voicechat", - "name": "nemotron-voicechat", - "display_name": "nemotron-voicechat", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0 + "input": 0.75, + "output": 2.4 }, "type": "chat" - }, + } + ] + }, + "perplexity-agent": { + "id": "perplexity-agent", + "name": "Perplexity Agent", + "display_name": "Perplexity Agent", + "api": "https://api.perplexity.ai/v1", + "doc": "https://docs.perplexity.ai/docs/agent-api/models", + "models": [ { - "id": "nvidia/riva-translate-4b-instruct-v1_1", - "name": "riva-translate-4b-instruct-v1_1", - "display_name": "riva-translate-4b-instruct-v1_1", + "id": 
"xai/grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 30000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-12", - "last_updated": "2025-12-12", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07", + "release_date": "2025-11-19", + "last_updated": "2025-11-19", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "nvidia/nemotron-content-safety-reasoning-4b", - "name": "nemotron-content-safety-reasoning-4b", - "display_name": "nemotron-content-safety-reasoning-4b", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0, - 
"output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super", - "display_name": "Nemotron 3 Super", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -106969,252 +113044,469 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "nvidia/gliner-pii", - "name": "gliner-pii", - "display_name": "gliner-pii", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, - 
"tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0, - "output": 0 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "nvidia/bevformer", - "name": "bevformer", - "display_name": "bevformer", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "video" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-03-18", - "last_updated": "2025-07-20", + "open_weights": false, + "knowledge": "2025-01", + "release_date": 
"2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tiers": [ + { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 0.5, + "output": 3, + "cache_read": 0.05 + } }, "type": "chat" }, { - "id": "nvidia/active-speaker-detection", - "name": "Active Speaker Detection", - "display_name": "Active Speaker Detection", + "id": "openai/gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "video" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0, - "output": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "minimaxai/minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "openai/gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { 
"supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-04-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "microsoft/phi-4-multimodal-instruct", - "name": "Phi 4 Multimodal", - "display_name": "Phi 4 Multimodal", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-26", - "last_updated": "2025-07-26", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2, + 
"cache_read": 0.025 }, "type": "chat" }, { - "id": "microsoft/phi-4-mini-instruct", - "name": "Phi-4-Mini", - "display_name": "Phi-4-Mini", + "id": "openai/gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2025-09-05", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0, - "output": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.7-flash", - "name": "Step 3.7 Flash", - "display_name": "Step 3.7 Flash", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", 
+ "high" + ], + "visibility": "hidden" + } + }, "attachment": true, - "open_weights": true, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "stepfun-ai/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -107224,8 +113516,8 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 1000000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -107235,209 +113527,386 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2.5 }, "type": "chat" }, { - "id": "meta/llama-3.1-70b-instruct", - "name": "Llama 3.1 70b Instruct", - "display_name": "Llama 3.1 70b Instruct", + "id": "anthropic/claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + 
"high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta/llama-guard-4-12b", - "name": "Llama Guard 4 12B", - "display_name": "Llama Guard 4 12B", + "id": "anthropic/claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2026-04-30", + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "meta/llama-4-maverick-17b-128e-instruct", - "name": "Llama 4 Maverick 17b 128e Instruct", - "display_name": "Llama 4 Maverick 17b 128e Instruct", + "id": "anthropic/claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-02", - "release_date": "2025-04-01", - "last_updated": "2025-04-01", + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta/esm2-650m", - "name": "esm2-650m", - "display_name": "esm2-650m", + "id": "anthropic/claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-08-29", - "last_updated": "2025-03-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0, - "output": 0 + "input": 1, + "output": 5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b-instruct", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "anthropic/claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32000 + "context": 200000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b-vision-instruct", - "name": "Llama 3.2 11b Vision Instruct", - "display_name": "Llama 3.2 11b Vision Instruct", + "id": "anthropic/claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0, - "output": 0 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b-instruct", - "name": "Llama 3.2 1b Instruct", - "display_name": "Llama 3.2 1b Instruct", + "id": "perplexity/sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ "text" @@ -107448,7 +113917,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -107456,20 +113925,30 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 2.5, + "cache_read": 0.0625 }, "type": "chat" - }, + } + ] + }, + "siliconflow-com": { + "id": "siliconflow-com", + "name": "SiliconFlow", + "display_name": "SiliconFlow", + "api": "https://api.siliconflow.com/v1", + "doc": "https://cloud.siliconflow.com/models", + "models": [ { - "id": "meta/esmfold", - "name": "esmfold", - "display_name": "esmfold", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "THUDM/GLM-Z1-32B-0414", + "display_name": "THUDM/GLM-Z1-32B-0414", "modalities": { "input": [ "text" @@ -107479,28 +113958,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2024-03-15", - "last_updated": "2025-06-12", + "open_weights": 
false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b-instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "THUDM/GLM-4-32B-0414", + "name": "THUDM/GLM-4-32B-0414", + "display_name": "THUDM/GLM-4-32B-0414", "modalities": { "input": [ "text" @@ -107510,8 +113990,8 @@ ] }, "limit": { - "context": 16000, - "output": 4096 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, @@ -107519,20 +113999,19 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b-instruct", - "name": "Llama 3.3 70b Instruct", - "display_name": "Llama 3.3 70b Instruct", + "id": "THUDM/GLM-4-9B-0414", + "name": "THUDM/GLM-4-9B-0414", + "display_name": "THUDM/GLM-4-9B-0414", "modalities": { "input": [ "text" @@ -107542,8 +114021,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, @@ -107551,52 +114030,51 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-11-26", - "last_updated": "2024-11-26", + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "meta/llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "THUDM/GLM-Z1-9B-0414", + "display_name": "THUDM/GLM-Z1-9B-0414", "modalities": { "input": [ - 
"text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "attachment": false, + "open_weights": false, + "release_date": "2025-04-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.086, + "output": 0.086 }, "type": "chat" }, { - "id": "baai/bge-m3", - "name": "BGE M3", - "display_name": "BGE M3", + "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -107606,41 +114084,39 @@ ] }, "limit": { - "context": 8192, - "output": 1024 + "context": 33000, + "output": 4000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-01-30", - "last_updated": "2026-04-30", + "open_weights": false, + "release_date": "2025-04-23", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.06, + "output": 0.06 }, - "type": "embedding" + "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma-4-31B-IT", - "display_name": "Gemma-4-31B-IT", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "moonshotai/Kimi-K2-Thinking", + "display_name": "moonshotai/Kimi-K2-Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -107648,21 +114124,31 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": 
true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-07", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.55, + "output": 2.5 }, "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma 2 2b It", - "display_name": "Gemma 2 2b It", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "moonshotai/Kimi-K2-Instruct-0905", + "display_name": "moonshotai/Kimi-K2-Instruct-0905", "modalities": { "input": [ "text" @@ -107672,8 +114158,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -107681,52 +114167,50 @@ "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-16", - "last_updated": "2024-07-16", + "open_weights": false, + "release_date": "2025-09-08", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "google/gemma-3n-e4b-it", - "name": "Gemma 3n E4b It", - "display_name": "Gemma 3n E4b It", + "id": "moonshotai/Kimi-K2-Instruct", + "name": "moonshotai/Kimi-K2-Instruct", + "display_name": "moonshotai/Kimi-K2-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-03", - "last_updated": "2025-06-03", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-13", + "last_updated": "2025-11-25", 
"cost": { - "input": 0, - "output": 0 + "input": 0.58, + "output": 2.29 }, "type": "chat" }, { - "id": "google/google-paligemma", - "name": "paligemma", - "display_name": "paligemma", + "id": "moonshotai/Kimi-K2.6", + "name": "moonshotai/Kimi-K2.6", + "display_name": "moonshotai/Kimi-K2.6", "modalities": { "input": [ "text", @@ -107737,28 +114221,41 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262000, + "output": 262000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2024-05-14", - "last_updated": "2024-08-26", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "google/gemma-3n-e2b-it", - "name": "Gemma 3n E2b It", - "display_name": "Gemma 3n E2b It", + "id": "moonshotai/Kimi-K2.5", + "name": "moonshotai/Kimi-K2.5", + "display_name": "moonshotai/Kimi-K2.5", "modalities": { "input": [ "text", @@ -107769,29 +114266,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2025-06-12", - "last_updated": "2025-06-12", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - 
"input": 0, - "output": 0 + "input": 0.45, + "output": 2.25 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "baidu/ERNIE-4.5-300B-A47B", + "name": "baidu/ERNIE-4.5-300B-A47B", + "display_name": "baidu/ERNIE-4.5-300B-A47B", "modalities": { "input": [ "text" @@ -107801,35 +114309,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-04", - "last_updated": "2025-08-14", + "open_weights": false, + "release_date": "2025-07-02", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.28, + "output": 1.1 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", "modalities": { "input": [ "text" @@ -107839,66 +114340,65 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-09-04", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.21, + "output": 0.57 }, "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": 
"stepfun-ai/Step-3.5-Flash", + "name": "stepfun-ai/Step-3.5-Flash", + "display_name": "stepfun-ai/Step-3.5-Flash", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 262000, + "output": 262000 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "bytedance/seed-oss-36b-instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "inclusionAI/Ring-flash-2.0", + "name": "inclusionAI/Ring-flash-2.0", + "display_name": "inclusionAI/Ring-flash-2.0", "modalities": { "input": [ "text" @@ -107908,13 +114408,14 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -107923,27 +114424,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-04", + "release_date": "2025-09-29", "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" - } - ] - }, - "routing-run": { - "id": "routing-run", - "name": "routing.run", - "display_name": "routing.run", - "api": "https://ai.routing.sh/v1", - "doc": "https://docs.routing.run/api-reference/models", - "models": [ + }, { - "id": "route/mistral-large-3", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "inclusionAI/Ling-mini-2.0", + "name": 
"inclusionAI/Ling-mini-2.0", + "display_name": "inclusionAI/Ling-mini-2.0", "modalities": { "input": [ "text" @@ -107953,8 +114445,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -107962,67 +114454,63 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "route/mistral-small-2503", - "name": "Mistral Small 2503", - "display_name": "Mistral Small 2503", + "id": "inclusionAI/Ling-flash-2.0", + "name": "inclusionAI/Ling-flash-2.0", + "display_name": "inclusionAI/Ling-flash-2.0", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "route/mimo-v2.5-pro-6bit", - "name": "MiMo V2.5 Pro 6bit", - "display_name": "MiMo V2.5 Pro 6bit", + "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", "modalities": { "input": [ "text", "image", - "video" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 262144 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, @@ -108042,50 +114530,31 @@ } 
}, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.45, - "output": 1.35, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "route/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "Qwen/Qwen2.5-VL-72B-Instruct", + "name": "Qwen/Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, @@ -108093,74 +114562,62 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "route/qwen3.6-27b", - "name": "Qwen3.6 27B", - "display_name": "Qwen3.6 27B", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen/Qwen2.5-VL-32B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202000, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-03-24", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.27, + "output": 0.27 }, "type": "chat" }, { - "id": "route/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -108179,21 +114636,20 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0.4928, - "output": 0.7392 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "route/minimax-m2.7-highspeed", - "name": "MiniMax M2.7 Highspeed", - "display_name": "MiniMax M2.7 Highspeed", + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "modalities": { "input": [ "text" @@ -108203,89 +114659,60 @@ ] }, "limit": { - "context": 100000, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": 
"2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.33, - "output": 1.32, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "route/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.462, - "output": 2.42, - "cache_read": 0.16 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "route/deepseek-v4-flash-6bit", - "name": "DeepSeek V4 Flash 6bit", - "display_name": "DeepSeek V4 Flash 6bit", + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", "modalities": { "input": [ "text" @@ -108295,42 +114722,28 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": 
[ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2024-09-19", + "last_updated": "2025-11-25", "cost": { - "input": 0.4928, - "output": 0.7392, - "cache_read": 0.0028 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "route/qwen3.6-27b-202k", - "name": "Qwen3.6 27B 202K", - "display_name": "Qwen3.6 27B 202K", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -108340,39 +114753,28 @@ ] }, "limit": { - "context": 202000, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.14, + "output": 1.4 }, "type": "chat" }, { - "id": "route/deepseek-v4-pro-6bit", - "name": "DeepSeek V4 Pro 6bit", - "display_name": "DeepSeek V4 Pro 6bit", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -108382,8 +114784,8 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -108403,102 +114805,81 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - 
"last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.4928, - "output": 0.7392, - "cache_read": 0.003625 + "input": 0.13, + "output": 0.6 }, "type": "chat" }, { - "id": "route/kimi-k2.6-6bit", - "name": "Kimi K2.6 6bit", - "display_name": "Kimi K2.6 6bit", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0.462, - "output": 2.42, - "cache_read": 0.16 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "route/mistral-medium-2505", - "name": "Mistral Medium 2505", - "display_name": "Mistral Medium 2505", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": 
"2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2025-07-31", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 2 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "route/step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ "text" @@ -108508,42 +114889,28 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "open_weights": false, + "release_date": "2025-08-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "route/glm-5.1-6bit", - "name": "GLM 5.1 6bit", - "display_name": "GLM 5.1 6bit", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", "modalities": { "input": [ "text" @@ -108553,53 +114920,40 @@ ] }, "limit": { - "context": 202752, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - 
"open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2025-07-30", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.09, + "output": 0.3 }, "type": "chat" }, { - "id": "route/stepfun-3.5-flash", - "name": "StepFun 3.5 Flash", - "display_name": "StepFun 3.5 Flash", + "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -108618,33 +114972,32 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "route/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "Qwen/Qwen3-VL-8B-Thinking", + "name": "Qwen/Qwen3-VL-8B-Thinking", + "display_name": "Qwen/Qwen3-VL-8B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -108663,67 +115016,52 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.33, - "output": 1.32, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.18, + "output": 2 }, "type": 
"chat" }, { - "id": "route/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "Qwen/Qwen3-VL-8B-Instruct", + "name": "Qwen/Qwen3-VL-8B-Instruct", + "display_name": "Qwen/Qwen3-VL-8B-Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 0.4928, - "output": 0.7392, - "cache_read": 0.0028 + "input": 0.18, + "output": 0.68 }, "type": "chat" }, { - "id": "route/step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "Qwen/QwQ-32B", + "name": "Qwen/QwQ-32B", + "display_name": "Qwen/QwQ-32B", "modalities": { "input": [ "text" @@ -108733,8 +115071,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -108754,110 +115092,105 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": false, + "release_date": "2025-03-06", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.15, + "output": 0.58 }, "type": "chat" }, { - "id": "route/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": 
"Qwen/Qwen3-Omni-30B-A3B-Captioner", + "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", "modalities": { "input": [ - "text" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 131072 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.193, - "output": 1.238, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "route/minimax-m2.5-highspeed", - "name": "MiniMax M2.5 Highspeed", - "display_name": "MiniMax M2.5 Highspeed", + "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.193, - "output": 1.238, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.45, + "output": 3.5 }, "type": "chat" }, { - "id": "route/mimo-v2.5", 
- "name": "MiMo V2.5", - "display_name": "MiMo V2.5", + "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -108876,38 +115209,20 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.45, - "output": 1.35, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "route/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -108917,88 +115232,60 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 33000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2024-11-11", + "last_updated": "2025-11-25", "cost": { - "input": 0.4928, 
- "output": 0.7392, - "cache_read": 0.003625 + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "route/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "Qwen/Qwen2.5-VL-7B-Instruct", + "name": "Qwen/Qwen2.5-VL-7B-Instruct", + "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 33000, + "output": 4000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "open_weights": false, + "release_date": "2025-01-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.462, - "output": 2.42, - "cache_read": 0.1 + "input": 0.05, + "output": 0.05 }, "type": "chat" }, { - "id": "route/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "Qwen/Qwen3-8B", + "name": "Qwen/Qwen3-8B", + "display_name": "Qwen/Qwen3-8B", "modalities": { "input": [ "text" @@ -109008,14 +115295,13 @@ ] }, "limit": { - "context": 202752, - "output": 65536 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -109029,93 +115315,50 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - 
"id": "route/mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2025-11-25", "cost": { - "input": 0.45, - "output": 1.35, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0.09, + "output": 0.6 }, "type": "chat" - } - ] - }, - "xiaomi-token-plan-ams": { - "id": "xiaomi-token-plan-ams", - "name": "Xiaomi Token Plan (Europe)", - "display_name": "Xiaomi Token Plan (Europe)", - "api": "https://token-plan-ams.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "Qwen/Qwen3-32B", + "name": "Qwen/Qwen3-32B", + "display_name": "Qwen/Qwen3-32B", "modalities": { "input": [ "text" @@ -109125,14 +115368,13 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - 
"supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -109146,71 +115388,98 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "mimo-v2.5-tts", - "name": "MiMo-V2.5-TTS", - "display_name": "MiMo-V2.5-TTS", + "id": "Qwen/Qwen3-VL-32B-Instruct", + "name": "Qwen/Qwen3-VL-32B-Instruct", + "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-21", + "last_updated": "2025-11-25", + "cost": { + "input": 0.2, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-14B-Instruct", + "name": "Qwen/Qwen2.5-14B-Instruct", + "display_name": "Qwen/Qwen2.5-14B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 33000, + "output": 4000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "Qwen/Qwen3-14B", + "name": "Qwen/Qwen3-14B", + "display_name": "Qwen/Qwen3-14B", "modalities": { "input": [ - "text", - "image", - 
"audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -109223,22 +115492,20 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "Qwen/Qwen3-235B-A22B", + "name": "Qwen/Qwen3-235B-A22B", + "display_name": "Qwen/Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -109248,14 +115515,13 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -109270,95 +115536,126 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.35, + "output": 1.42 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voiceclone", - "name": "MiMo-V2.5-TTS-VoiceClone", - "display_name": "MiMo-V2.5-TTS-VoiceClone", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 33000, + "output": 4000 }, - "tool_call": false, + "temperature": 
true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2024-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.59, + "output": 0.59 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voicedesign", - "name": "MiMo-V2.5-TTS-VoiceDesign", - "display_name": "MiMo-V2.5-TTS-VoiceDesign", + "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", "modalities": { "input": [ + "text", + "image", + "audio" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 66000, + "output": 66000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "modalities": { + "input": [ + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262000, + "output": 262000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.29, + "output": 1 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "Qwen/Qwen3-VL-32B-Thinking", + "name": "Qwen/Qwen3-VL-32B-Thinking", + "display_name": "Qwen/Qwen3-VL-32B-Thinking", 
"modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -109379,122 +115676,91 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.2, + "output": 1.5 }, "type": "chat" }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "openai/gpt-oss-120b", + "name": "openai/gpt-oss-120b", + "display_name": "openai/gpt-oss-120b", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 131000, + "output": 8000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0, - "output": 0 + "input": 0.05, + "output": 0.45 }, "type": "chat" - } - ] - }, - "deepinfra": { - "id": "deepinfra", - "name": "Deep Infra", - "display_name": "Deep Infra", - "doc": "https://deepinfra.com/models", - "models": [ + }, { - "id": "XiaomiMiMo/MiMo-V2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "openai/gpt-oss-20b", + "name": "openai/gpt-oss-20b", + "display_name": "openai/gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 131000, + "output": 8000 }, 
"temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": false, + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.08, - "tiers": [ - { - "input": 0.8, - "output": 4, - "cache_read": 0.16, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 0.8, - "output": 4, - "cache_read": 0.16 - } + "input": 0.04, + "output": 0.18 }, "type": "chat" }, { - "id": "XiaomiMiMo/MiMo-V2.5-Pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "tencent/Hunyuan-MT-7B", + "name": "tencent/Hunyuan-MT-7B", + "display_name": "tencent/Hunyuan-MT-7B", "modalities": { "input": [ "text" @@ -109504,58 +115770,28 @@ ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 33000, + "output": 33000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - 
"context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "tencent/Hunyuan-A13B-Instruct", + "name": "tencent/Hunyuan-A13B-Instruct", + "display_name": "tencent/Hunyuan-A13B-Instruct", "modalities": { "input": [ "text" @@ -109565,43 +115801,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.27, - "output": 0.95, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "nex-agi/DeepSeek-V3.1-Nex-N1", + "name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", "modalities": { "input": [ "text" @@ -109611,8 +115832,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -109620,44 +115841,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + 
"open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", "cost": { - "input": 0.43, - "output": 1.75, - "cache_read": 0.08 + "input": 0.5, + "output": 2 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "zai-org/GLM-5V-Turbo", + "name": "zai-org/GLM-5V-Turbo", + "display_name": "zai-org/GLM-5V-Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -109676,22 +115885,21 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 0.8, - "output": 2.56, - "cache_read": 0.16 + "input": 1.2, + "output": 4, + "cache_write": 0 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "zai-org/GLM-4.6", + "name": "zai-org/GLM-4.6", + "display_name": "zai-org/GLM-4.6", "modalities": { "input": [ "text" @@ -109701,53 +115909,45 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "open_weights": false, + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.5, + "output": 1.9 }, "type": 
"chat" }, { - "id": "zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "zai-org/GLM-4.6V", + "name": "zai-org/GLM-4.6V", + "display_name": "zai-org/GLM-4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -109755,32 +115955,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-07", + "last_updated": "2025-12-07", "cost": { - "input": 0.06, - "output": 0.4 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "zai-org/GLM-5", + "name": "zai-org/GLM-5", + "display_name": "zai-org/GLM-5", "modalities": { "input": [ "text" @@ -109790,8 +115978,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, @@ -109812,33 +116000,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.43, - "output": 1.74, - "cache_read": 0.08 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "zai-org/GLM-4.7", + "name": "zai-org/GLM-4.7", + "display_name": "zai-org/GLM-4.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] 
}, "limit": { - "context": 262144, - "output": 16384 + "context": 205000, + "output": 205000 }, "temperature": true, "tool_call": true, @@ -109857,68 +116041,52 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.75, - "output": 3.5, - "cache_read": 0.15 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "zai-org/GLM-4.5V", + "name": "zai-org/GLM-4.5V", + "display_name": "zai-org/GLM-4.5V", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 66000, + "output": 66000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2025-08-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.5, - "output": 2.8 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", - "name": "Llama 3.3 70B Turbo", - "display_name": "Llama 3.3 70B Turbo", + "id": "zai-org/GLM-4.5-Air", + "name": "zai-org/GLM-4.5-Air", + "display_name": "zai-org/GLM-4.5-Air", "modalities": { "input": [ "text" @@ -109928,87 +116096,101 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false 
}, "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.32 + "input": 0.14, + "output": 0.86 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B FP8", - "display_name": "Llama 4 Maverick 17B FP8", + "id": "zai-org/GLM-5.1", + "name": "zai-org/GLM-5.1", + "display_name": "zai-org/GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 205000, + "output": 205000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-04-08", + "last_updated": "2026-04-08", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.4, + "output": 4.4, + "cache_write": 0 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B", - "display_name": "Llama 4 Scout 17B", + "id": "zai-org/GLM-4.5", + "name": "zai-org/GLM-4.5", + "display_name": "zai-org/GLM-4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 10000000, - "output": 16384 + "context": 131000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "release_date": "2025-07-28", + "last_updated": "2025-11-25", "cost": { - 
"input": 0.08, - "output": 0.3 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Flash", + "id": "deepseek-ai/deepseek-v4-flash", "name": "DeepSeek V4 Flash", "display_name": "DeepSeek V4 Flash", "modalities": { @@ -110020,8 +116202,8 @@ ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -110046,16 +116228,16 @@ "release_date": "2026-04-24", "last_updated": "2026-04-24", "cost": { - "input": 0.1, - "output": 0.2, - "cache_read": 0.02 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "deepseek-ai/DeepSeek-R1", + "name": "deepseek-ai/DeepSeek-R1", + "display_name": "deepseek-ai/DeepSeek-R1", "modalities": { "input": [ "text" @@ -110065,8 +116247,8 @@ ] }, "limit": { - "context": 1048576, - "output": 16384 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -110086,21 +116268,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-05-28", + "last_updated": "2025-11-25", "cost": { - "input": 1.3, - "output": 2.6, - "cache_read": 0.1 + "input": 0.5, + "output": 2.18 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "modalities": { "input": [ "text" @@ -110110,8 +116290,8 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -110119,33 +116299,52 @@ "supported": true, "default": true }, - "extra_capabilities": { 
- "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", + "cost": { + "input": 0.18, + "output": 0.18 + }, + "type": "chat" + }, + { + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 164000, + "output": 164000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2025-09-29", + "last_updated": "2025-11-25", "cost": { - "input": 0.26, - "output": 0.38, - "cache_read": 0.13 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "deepseek-ai/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -110155,11 +116354,11 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 1000000, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -110176,21 +116375,21 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.5, - "output": 2.15, - "cache_read": 0.35 + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "deepseek-ai/DeepSeek-V3.1", + "display_name": "deepseek-ai/DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -110200,42 +116399,40 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-08-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "deepseek-ai/DeepSeek-V3.2-Exp", + "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -110243,90 +116440,63 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "attachment": false, + "open_weights": false, + "release_date": "2025-10-10", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 1 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-35B-A3B", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 
35B A3B", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 4000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", + "open_weights": false, + "release_date": "2024-12-13", + "last_updated": "2025-11-25", "cost": { - "input": 0.2, - "output": 0.95 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen 3.5 397B A17B", - "display_name": "Qwen 3.5 397B A17B", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "deepseek-ai/DeepSeek-V3.2", + "display_name": "deepseek-ai/DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, @@ -110336,75 +116506,65 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-01", - "last_updated": "2026-04-20", + "attachment": false, + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 0.54, - "output": 3.4 + "input": 0.27, + "output": 0.42 }, "type": "chat" }, { - "id": 
"google/gemma-4-26B-A4B-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "deepseek-ai/DeepSeek-V3", + "name": "deepseek-ai/DeepSeek-V3", + "display_name": "deepseek-ai/DeepSeek-V3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-26", + "last_updated": "2025-11-25", "cost": { - "input": 0.07, - "output": 0.34 + "input": 0.25, + "output": 1 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -110412,20 +116572,20 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-11-25", "cost": { - "input": 0.13, - "output": 0.38 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMaxAI/MiniMax-M2.1", + "display_name": "MiniMaxAI/MiniMax-M2.1", "modalities": { "input": [ "text" @@ -110435,14 +116595,13 @@ ] }, "limit": { - "context": 
131072, - "output": 16384 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -110450,19 +116609,19 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.05, - "output": 0.24 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMaxAI/MiniMax-M2.5", + "display_name": "MiniMaxAI/MiniMax-M2.5", "modalities": { "input": [ "text" @@ -110472,14 +116631,13 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 197000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -110487,44 +116645,42 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.03, - "output": 0.14 + "input": 0.3, + "output": 1.2 }, "type": "chat" } ] }, - "zhipuai": { - "id": "zhipuai", - "name": "Zhipu AI", - "display_name": "Zhipu AI", - "api": "https://open.bigmodel.cn/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", + "umans-ai-coding-plan": { + "id": "umans-ai-coding-plan", + "name": "Umans AI Coding Plan", + "display_name": "Umans AI Coding Plan", + "api": "https://api.code.umans.ai/v1", + "doc": "https://app.umans.ai/offers/code/docs", "models": [ { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "umans-kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", 
"modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -110542,21 +116698,22 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 5, - "output": 22, - "cache_read": 1.2, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "umans-glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -110588,33 +116745,34 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "umans-coder", + "name": "Umans Coder", + "display_name": "Umans Coder", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -110631,137 +116789,140 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 6, - "output": 24, - "cache_read": 1.3, + 
"input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "umans-flash", + "name": "Umans Flash", + "display_name": "Umans Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "umans-qwen3.6-35b-a3b", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 262144 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, + "input": 0, + "output": 0, + "cache_read": 0, "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "io-net": { + "id": "io-net", + "name": "IO.NET", + "display_name": "IO.NET", + "api": "https://api.intelligence.io.solutions/api/v1", + "doc": "https://io.net/docs/guides/intelligence/io-intelligence", + "models": [ { - "id": 
"glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 430000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2024-12", + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -110769,64 +116930,65 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.13, + "output": 0.38, + "cache_read": 0.065, + "cache_write": 0.26 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": 
"meta-llama/Llama-3.2-90B-Vision-Instruct", + "name": "Llama 3.2 90B Vision Instruct", + "display_name": "Llama 3.2 90B Vision Instruct", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 16000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 0.6, - "output": 1.8 + "input": 0.35, + "output": 0.4, + "cache_read": 0.175, + "cache_write": 0.7 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -110836,8 +116998,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -110857,22 +117019,22 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.55, + "output": 2.25, + "cache_read": 0.275, + "cache_write": 1.1 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -110882,72 +117044,66 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 
4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "knowledge": "2024-08", + "release_date": "2024-09-05", + "last_updated": "2024-09-05", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.39, + "output": 1.9, + "cache_read": 0.195, + "cache_write": 0.78 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen 2.5 VL 32B Instruct", + "display_name": "Qwen 2.5 VL 32B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 0.05, + "output": 0.22, + "cache_read": 0.025, + "cache_write": 0.1 }, "type": "chat" }, { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", + "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen 3 Next 80B Instruct", + "display_name": "Qwen 3 Next 80B Instruct", "modalities": { "input": [ "text" @@ -110957,41 +117113,31 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 262144, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, 
- "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2024-12", + "release_date": "2025-01-10", + "last_updated": "2025-01-10", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.8, + "cache_read": 0.05, + "cache_write": 0.2 }, "type": "chat" - } - ] - }, - "io-net": { - "id": "io-net", - "name": "IO.NET", - "display_name": "IO.NET", - "api": "https://api.intelligence.io.solutions/api/v1", - "doc": "https://io.net/docs/guides/intelligence/io-intelligence", - "models": [ + }, { - "id": "mistralai/Magistral-Small-2506", - "name": "Magistral Small 2506", - "display_name": "Magistral Small 2506", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen 3 235B Thinking", + "display_name": "Qwen 3 235B Thinking", "modalities": { "input": [ "text" @@ -111001,66 +117147,82 @@ ] }, "limit": { - "context": 128000, + "context": 262144, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.25, - "cache_write": 1 + "input": 0.11, + "output": 0.6, + "cache_read": 0.055, + "cache_write": 0.22 }, "type": "chat" }, { - "id": "mistralai/Mistral-Large-Instruct-2411", - "name": "Mistral Large Instruct 2411", - "display_name": "Mistral Large Instruct 2411", + "id": "openai/gpt-oss-120b", + "name": "GPT-OSS 120B", + 
"display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, + "open_weights": true, "knowledge": "2024-10", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2, - "output": 6, - "cache_read": 1, - "cache_write": 4 + "input": 0.04, + "output": 0.4, + "cache_read": 0.02, + "cache_write": 0.08 }, "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "openai/gpt-oss-20b", + "name": "GPT-OSS 20B", + "display_name": "GPT-OSS 20B", "modalities": { "input": [ "text" @@ -111070,24 +117232,29 @@ ] }, "limit": { - "context": 128000, + "context": 64000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-05", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.02, - "output": 0.04, - "cache_read": 0.01, - "cache_write": 0.04 + "input": 0.03, + "output": 0.14, + "cache_read": 0.015, + "cache_write": 0.06 }, "type": "chat" }, @@ -111126,9 +117293,9 @@ "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "mistralai/Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ "text" @@ -111138,46 
+117305,42 @@ ] }, "limit": { - "context": 200000, + "context": 128000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-15", - "last_updated": "2024-11-15", + "knowledge": "2025-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.4, - "output": 1.75, - "cache_read": 0.2, - "cache_write": 0.8 + "input": 0.5, + "output": 1.5, + "cache_read": 0.25, + "cache_write": 1 }, "type": "chat" }, { - "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "mistralai/Mistral-Large-Instruct-2411", + "name": "Mistral Large Instruct 2411", + "display_name": "Mistral Large Instruct 2411", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 106000, + "context": 128000, "output": 4096 }, "temperature": true, @@ -111186,22 +117349,22 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2025-01-15", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.22, - "output": 0.95, - "cache_read": 0.11, - "cache_write": 0.44 + "input": 2, + "output": 6, + "cache_read": 1, + "cache_write": 4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -111211,7 +117374,7 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 4096 }, "temperature": true, @@ 
-111220,22 +117383,22 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-09-05", - "last_updated": "2024-09-05", + "open_weights": true, + "knowledge": "2024-05", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.39, - "output": 1.9, - "cache_read": 0.195, - "cache_write": 0.78 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01, + "cache_write": 0.04 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "Intel/Qwen3-Coder-480B-A35B-Instruct-int4-mixed-ar", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -111245,54 +117408,7 @@ ] }, "limit": { - "context": 32768, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", - "cost": { - "input": 0.55, - "output": 2.25, - "cache_read": 0.275, - "cache_write": 1.1 - }, - "type": "chat" - }, - { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct", - "display_name": "Llama 4 Maverick 17B 128E Instruct", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 430000, + "context": 106000, "output": 4096 }, "temperature": true, @@ -111306,52 +117422,56 @@ "release_date": "2025-01-15", "last_updated": "2025-01-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.22, + "output": 0.95, + "cache_read": 0.11, + "cache_write": 
0.44 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.2-90B-Vision-Instruct", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 16000, + "context": 200000, "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-11-15", + "last_updated": "2024-11-15", "cost": { - "input": 0.35, - "output": 0.4, - "cache_read": 0.175, - "cache_write": 0.7 + "input": 0.4, + "output": 1.75, + "cache_read": 0.2, + "cache_write": 0.8 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ "text" @@ -111367,25 +117487,46 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-28", "cost": { - "input": 0.13, - "output": 0.38, - "cache_read": 0.065, - "cache_write": 0.26 + "input": 2, + "output": 8.75, + "cache_read": 1, + "cache_write": 4 }, "type": 
"chat" - }, + } + ] + }, + "gmicloud": { + "id": "gmicloud", + "name": "GMI Cloud", + "display_name": "GMI Cloud", + "api": "https://api.gmi-serving.com/v1", + "doc": "https://docs.gmicloud.ai/inference-engine/api-reference/llm-api-reference", + "models": [ { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text" @@ -111395,8 +117536,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -111415,23 +117556,22 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-28", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 8.75, - "cache_read": 1, - "cache_write": 4 + "input": 0.855, + "output": 3.6, + "cache_read": 0.144 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen 3 235B Thinking", - "display_name": "Qwen 3 235B Thinking", + "id": "anthropic/claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text" @@ -111441,43 +117581,57 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 409600, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models 
require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.11, - "output": 0.6, - "cache_read": 0.055, - "cache_write": 0.22 + "input": 4.5, + "output": 22.5, + "cache_read": 0.45 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen 3 Next 80B Instruct", - "display_name": "Qwen 3 Next 80B Instruct", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text" @@ -111487,66 +117641,121 @@ ] }, "limit": { - "context": 262144, - "output": 4096 + "context": 409600, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-10", - "last_updated": "2025-01-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.1, - "output": 0.8, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 3, + "output": 15, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen 2.5 VL 32B Instruct", - "display_name": "Qwen 2.5 VL 32B Instruct", + "id": "anthropic/claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 409600, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.05, - "output": 0.22, - "cache_read": 0.025, - "cache_write": 0.1 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "zai-org/GLM-5.1-FP8", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -111556,36 +117765,41 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.04, - "output": 0.4, - "cache_read": 0.02, - "cache_write": 0.08 + "input": 0.98, + "output": 3.08, + "cache_read": 0.182 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT-OSS 20B", - "display_name": "GPT-OSS 20B", + "id": "zai-org/GLM-5-FP8", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -111595,71 +117809,86 @@ ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.03, - "output": 0.14, - "cache_read": 0.015, - "cache_write": 0.06 + "input": 0.6, + "output": 1.92, + "cache_read": 0.12 }, "type": "chat" - } - ] - }, - "groq": { - "id": "groq", - "name": "Groq", - "display_name": "Groq", - "doc": "https://console.groq.com/docs/models", - "models": [ + }, { - "id": "whisper-large-v3-turbo", - "name": "Whisper Large V3 Turbo", - "display_name": "Whisper Large V3 Turbo", + "id": "deepseek-ai/DeepSeek-V4-Flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048575, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.112, + "output": 0.224, + "cache_read": 0.022 + }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -111669,99 +117898,125 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": 
false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.05, - "output": 0.08 + "input": 1.392, + "output": 2.784, + "cache_read": 0.116 }, "type": "chat" - }, + } + ] + }, + "xiaomi-token-plan-cn": { + "id": "xiaomi-token-plan-cn", + "name": "Xiaomi Token Plan (China)", + "display_name": "Xiaomi Token Plan (China)", + "api": "https://token-plan-cn.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "whisper-large-v3", - "name": "Whisper", - "display_name": "Whisper", + "id": "mimo-v2.5-tts-voiceclone", + "name": "MiMo-V2.5-TTS-VoiceClone", + "display_name": "MiMo-V2.5-TTS-VoiceClone", "modalities": { "input": [ - "audio" + "text" ], "output": [ - "text" + "audio" ] }, "limit": { "context": 8192, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-09-01", - "last_updated": "2025-09-05", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "mimo-v2.5-tts-voicedesign", + "name": "MiMo-V2.5-TTS-VoiceDesign", + "display_name": "MiMo-V2.5-TTS-VoiceDesign", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": 
false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.59, - "output": 0.79 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen/qwen3-32b", - "name": "Qwen3-32B", - "display_name": "Qwen3-32B", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -111780,84 +118035,101 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-06-11", - "last_updated": "2025-06-12", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.29, - "output": 0.59 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E", - "display_name": "Llama 4 Scout 17B 16E", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + 
"last_updated": "2026-03-18", "cost": { - "input": 0.11, - "output": 0.34 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-86m", - "name": "Prompt Guard 2 86M", - "display_name": "Prompt Guard 2 86M", + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 512, - "output": 512 + "context": 8192, + "output": 8192 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-05-29", - "last_updated": "2025-05-29", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "meta-llama/llama-prompt-guard-2-22m", - "name": "Llama Prompt Guard 2 22M", - "display_name": "Llama Prompt Guard 2 22M", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -111867,28 +118139,42 @@ ] }, "limit": { - "context": 512, - "output": 512 + "context": 1048576, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2025-05-29", - "last_updated": "2025-05-29", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.03, - "output": 0.03 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "groq/compound-mini", - "name": "Compound Mini", - "display_name": "Compound 
Mini", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -111898,78 +118184,42 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 1048576, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-09-04", - "type": "chat" - }, - { - "id": "groq/compound", - "name": "Compound", - "display_name": "Compound", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 8192 + "supported": true, + "default": true }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-09-04", - "type": "chat" - }, - { - "id": "canopylabs/orpheus-v1-english", - "name": "Canopy Labs Orpheus V1 English", - "display_name": "Canopy Labs Orpheus V1 English", - "modalities": { - "input": [ - "text" - ], - "output": [ - "audio" - ] - }, - "limit": { - "context": 4000, - "output": 50000 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0, + "cache_read": 0 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", "type": "chat" }, { - "id": "canopylabs/orpheus-arabic-saudi", - "name": "Canopy Labs Orpheus Arabic Saudi", - "display_name": "Canopy Labs Orpheus Arabic Saudi", + "id": "mimo-v2.5-tts", + "name": 
"MiMo-V2.5-TTS", + "display_name": "MiMo-V2.5-TTS", "modalities": { "input": [ "text" @@ -111979,24 +118229,36 @@ ] }, "limit": { - "context": 4000, - "output": 50000 + "context": 8192, + "output": 8192 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" - }, + } + ] + }, + "scaleway": { + "id": "scaleway", + "name": "Scaleway", + "display_name": "Scaleway", + "api": "https://api.scaleway.ai/v1", + "doc": "https://www.scaleway.com/en/docs/generative-apis/", + "models": [ { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -112006,8 +118268,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 260000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -112015,26 +118277,22 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-10-21", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2026-03-17", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.75, + "output": 2.25, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ "text" @@ -112044,35 +118302,29 @@ ] }, "limit": { - "context": 131072, - "output": 
65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-09-25", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2026-03-17", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.0375 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "openai/gpt-oss-safeguard-20b", - "name": "Safety GPT OSS 20B", - "display_name": "Safety GPT OSS 20B", + "id": "qwen3-embedding-8b", + "name": "Qwen3 Embedding 8B", + "display_name": "Qwen3 Embedding 8B", "modalities": { "input": [ "text" @@ -112082,74 +118334,59 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 32768, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "open_weights": false, + "release_date": "2025-25-11", + "last_updated": "2026-03-17", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 0.1, + "output": 0 }, - "type": "chat" - } - ] - }, - "sap-ai-core": { - "id": "sap-ai-core", - "name": "SAP AI Core", - "display_name": "SAP AI Core", - "doc": "https://help.sap.com/docs/sap-ai-core", - "models": [ + "type": "embedding" + }, { - "id": "anthropic--claude-3-sonnet", - "name": "anthropic--claude-3-sonnet", - "display_name": "anthropic--claude-3-sonnet", + "id": "bge-multilingual-gemma2", + "name": "BGE Multilingual Gemma2", + "display_name": "BGE Multilingual Gemma2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 
+ "context": 8191, + "output": 3072 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2024-07-26", + "last_updated": "2025-06-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "gpt-5-mini", - "display_name": "gpt-5-mini", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ "text", @@ -112160,10 +118397,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -112172,40 +118409,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-05-01", + "last_updated": "2026-05-22", "cost": { "input": 0.25, - "output": 2, - "cache_read": 0.025 + "output": 1.5 }, "type": "chat" }, { - "id": "sonar", - "name": "sonar", - "display_name": "sonar", + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -112215,140 
+118441,131 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 100000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": true, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-17", "cost": { - "input": 1, - "output": 1 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "anthropic--claude-4.6-sonnet", - "name": "anthropic--claude-4.6-sonnet", - "display_name": "anthropic--claude-4.6-sonnet", + "id": "pixtral-12b-2409", + "name": "Pixtral 12B 2409", + "display_name": "Pixtral 12B 2409", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2024-09", + "release_date": "2024-09-25", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "anthropic--claude-4.6-opus", - "name": "anthropic--claude-4.6-opus", - "display_name": "anthropic--claude-4.6-opus", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral Small 3.2 24B Instruct (2506)", + "display_name": "Mistral Small 3.2 24B Instruct (2506)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-03", + "release_date": "2025-06-20", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-sonnet", - "name": "anthropic--claude-4.5-sonnet", - "display_name": "anthropic--claude-4.5-sonnet", + "id": "gpt-oss-120b", + "name": "GPT-OSS 120B", + "display_name": "GPT-OSS 120B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2024-01-01", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-5", - "name": "gpt-5", - "display_name": "gpt-5", + "id": "gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B IT", + "display_name": "Gemma 4 26B A4B IT", "modalities": { "input": [ "text", @@ -112359,52 +118576,30 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": 
"effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-04-01", + "last_updated": "2026-05-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.25, + "output": 0.5 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "sonar-pro", - "display_name": "sonar-pro", + "id": "mistral-medium-3.5-128b", + "name": "Mistral Medium 3.5 128B", + "display_name": "Mistral Medium 3.5 128B", "modalities": { "input": [ "text", @@ -112415,137 +118610,121 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 256000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "open_weights": true, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 3, - "output": 15 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "gpt-4.1-mini", - "display_name": "gpt-4.1-mini", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 256000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": 
true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "gpt-5.4", - "display_name": "gpt-5.4", + "id": "whisper-large-v3", + "name": "Whisper Large v3", + "display_name": "Whisper Large v3", "modalities": { "input": [ - "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 8192, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "knowledge": "2023-09", + "release_date": "2023-09-01", + "last_updated": "2026-03-17", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.003, + "output": 0 }, "type": "chat" }, { - "id": "anthropic--claude-4.7-opus", - "name": "anthropic--claude-4.7-opus", - "display_name": "anthropic--claude-4.7-opus", + "id": "gemma-3-27b-it", + "name": "Gemma-3-27B-IT", + "display_name": "Gemma-3-27B-IT", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 
1000000, - "output": 128000 + "context": 40000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -112553,242 +118732,165 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.25, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "gpt-5.5", - "display_name": "gpt-5.5", + "id": "voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 32000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + "release_date": "2025-07-01", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "gpt-5-nano", - "display_name": "gpt-5-nano", + "id": "devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B Instruct (2512)", + "display_name": "Devstral 2 123B Instruct (2512)", "modalities": { "input": [ - "text", - 
"image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-01-07", + "last_updated": "2026-03-17", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.4, + "output": 2 }, "type": "chat" - }, + } + ] + }, + "ovhcloud": { + "id": "ovhcloud", + "name": "OVHcloud AI Endpoints", + "display_name": "OVHcloud AI Endpoints", + "api": "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1", + "doc": "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//", + "models": [ { - "id": "anthropic--claude-3-haiku", - "name": "anthropic--claude-3-haiku", - "display_name": "anthropic--claude-3-haiku", + "id": "llama-3.1-8b-instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-06-11", + 
"last_updated": "2025-06-11", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.11, + "output": 0.11 }, "type": "chat" }, { - "id": "anthropic--claude-3.7-sonnet", - "name": "anthropic--claude-3.7-sonnet", - "display_name": "anthropic--claude-3.7-sonnet", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder-30B-A3B-Instruct", + "display_name": "Qwen3-Coder-30B-A3B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-24", - "last_updated": "2025-02-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.07, + "output": 0.26 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "gemini-2.5-pro", - "display_name": "gemini-2.5-pro", + "id": "qwen3-32b", + "name": "Qwen3-32B", + "display_name": "Qwen3-32B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -112798,160 +118900,126 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "supported": true, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.09, + "output": 0.25 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "gpt-4.1", - "display_name": "gpt-4.1", + "id": "qwen3guard-gen-8b", + "name": "Qwen3Guard-Gen-8B", + "display_name": "Qwen3Guard-Gen-8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "type": "chat" }, { - "id": "anthropic--claude-3.5-sonnet", - "name": "anthropic--claude-3.5-sonnet", - "display_name": "anthropic--claude-3.5-sonnet", + "id": "qwen3guard-gen-0.6b", + "name": "Qwen3Guard-Gen-0.6B", + "display_name": "Qwen3Guard-Gen-0.6B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 32768, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, 
- "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "type": "chat" }, { - "id": "anthropic--claude-4.5-opus", - "name": "anthropic--claude-4.5-opus", - "display_name": "anthropic--claude-4.5-opus", + "id": "meta-llama-3_3-70b-instruct", + "name": "Meta-Llama-3_3-70B-Instruct", + "display_name": "Meta-Llama-3_3-70B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.74, + "output": 0.74 }, "type": "chat" }, { - "id": "anthropic--claude-3-opus", - "name": "anthropic--claude-3-opus", - "display_name": "anthropic--claude-3-opus", + "id": "mistral-small-3.2-24b-instruct-2506", + "name": "Mistral-Small-3.2-24B-Instruct-2506", + "display_name": "Mistral-Small-3.2-24B-Instruct-2506", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -112959,97 +119027,63 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "open_weights": true, + 
"release_date": "2025-07-16", + "last_updated": "2025-07-16", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.1, + "output": 0.31 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "gemini-2.5-flash-lite", - "display_name": "gemini-2.5-flash-lite", + "id": "qwen2.5-vl-72b-instruct", + "name": "Qwen2.5-VL-72B-Instruct", + "display_name": "Qwen2.5-VL-72B-Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2025-03-31", + "last_updated": "2025-03-31", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 1.01, + "output": 1.01 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "gemini-2.5-flash", - "display_name": "gemini-2.5-flash", + "id": "gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -113057,128 +119091,97 @@ }, "extra_capabilities": { "reasoning": { - 
"supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-04-17", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.09, + "output": 0.47 }, "type": "chat" }, { - "id": "anthropic--claude-4-sonnet", - "name": "anthropic--claude-4-sonnet", - "display_name": "anthropic--claude-4-sonnet", + "id": "mistral-7b-instruct-v0.3", + "name": "Mistral-7B-Instruct-v0.3", + "display_name": "Mistral-7B-Instruct-v0.3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-04-01", + "last_updated": "2025-04-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.11, + "output": 0.11 }, "type": "chat" }, { - "id": "anthropic--claude-4.5-haiku", - "name": "anthropic--claude-4.5-haiku", - "display_name": "anthropic--claude-4.5-haiku", + "id": "mistral-nemo-instruct-2407", + "name": "Mistral-Nemo-Instruct-2407", + "display_name": "Mistral-Nemo-Instruct-2407", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
200000, - "output": 64000 + "context": 65536, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "anthropic--claude-4-opus", - "name": "anthropic--claude-4-opus", - "display_name": "anthropic--claude-4-opus", + "id": "qwen3.6-27b", + "name": "Qwen3.6-27B", + "display_name": "Qwen3.6-27B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -113186,621 +119189,398 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "open_weights": true, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.47, + "output": 3.19 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "sonar-deep-research", - "display_name": "sonar-deep-research", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32768 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - 
"open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-02-01", - "last_updated": "2025-09-01", - "cost": { - "input": 2, - "output": 8, - "reasoning": 3 - }, - "type": "chat" - } - ] - }, - "freemodel": { - "id": "freemodel", - "name": "FreeModel", - "display_name": "FreeModel", - "api": "https://cc.freemodel.dev/v1", - "doc": "https://freemodel.dev", - "models": [ - { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen3.5-9b", + "name": "Qwen3.5-9B", + "display_name": "Qwen3.5-9B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.12, + "output": 0.18 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5-397B-A17B", + "display_name": "Qwen3.5-397B-A17B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "open_weights": true, + "release_date": "2026-05-18", + "last_updated": "2026-05-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.71, + "output": 4.25 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "cache_write": 2.5 + "input": 0.05, + "output": 0.18 }, "type": "chat" - }, + } + ] + }, + "friendli": { + "id": "friendli", + "name": "Friendli", + "display_name": "Friendli", + "api": "https://api.friendli.ai/serverless/v1", + "doc": "https://friendli.ai/docs/guides/serverless_endpoints/introduction", + "models": [ { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", 
"modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "cache_write": 5 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 8000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": 
"2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-08-01", + "last_updated": "2025-12-23", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175, - "cache_write": 1.75 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-01-29", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075, - "cache_write": 0.75 + "input": 1, + "output": 3.2, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 
1000000, - "output": 128000 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", 
"continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" } ] }, - "lilac": { - "id": "lilac", - "name": "Lilac", - "display_name": "Lilac", - "api": "https://api.getlilac.com/v1", - "doc": "https://docs.getlilac.com/inference/models", + "tencent-tokenhub": { + "id": "tencent-tokenhub", + "name": "Tencent TokenHub", + "display_name": "Tencent TokenHub", + "api": "https://tokenhub.tencentmaas.com/v1", + "doc": "https://cloud.tencent.com/document/product/1823/130050", "models": [ { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "hy3-preview", + "name": "Hy3 preview", + "display_name": "Hy3 preview", "modalities": { "input": [ "text" @@ -113810,8 +119590,8 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -113821,31 +119601,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { 
- "input": 0.9, - "output": 3, - "cache_read": 0.27 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "wandb": { + "id": "wandb", + "name": "Weights & Biases", + "display_name": "Weights & Biases", + "api": "https://api.inference.wandb.ai/v1", + "doc": "https://docs.wandb.ai/guides/integrations/inference/", + "models": [ { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -113856,8 +119639,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 64000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -113865,33 +119648,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2024-12", + "release_date": "2025-01-31", + "last_updated": "2026-03-12", "cost": { - "input": 0.7, - "output": 3.5, - "cache_read": 0.2 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "minimaxai/minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -113901,8 +119672,8 @@ ] }, "limit": { - "context": 204800, - "output": 204800 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -113910,88 +119681,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": 
true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2026-03-12", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.055 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama 3.1 70B", + "display_name": "Llama 3.1 70B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 262100 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.11, - "output": 0.35 + "input": 0.8, + "output": 0.8 }, "type": "chat" - } - ] - }, - "stepfun-ai": { - "id": "stepfun-ai", - "name": "StepFun AI", - "display_name": "StepFun AI", - "api": "https://api.stepfun.ai/step_plan/v1", - "doc": "https://platform.stepfun.ai/docs/en/step-plan/integrations/open-code", - "models": [ + }, { - "id": "step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "meta-llama/Llama-3.1-8B-Instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ 
-114001,8 +119736,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -114012,31 +119747,31 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.22, + "output": 0.22 }, "type": "chat" }, { - "id": "step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -114044,31 +119779,31 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "release_date": "2026-01-27", + "last_updated": "2026-03-12", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.5, + "output": 2.85 }, "type": "chat" - } - ] - }, - "tencent-coding-plan": { - "id": "tencent-coding-plan", - "name": "Tencent Coding Plan (China)", - "display_name": "Tencent Coding Plan (China)", - "api": "https://api.lkeap.cloud.tencent.com/coding/v3", - "doc": "https://cloud.tencent.com/document/product/1772/128947", - "models": [ + }, { - "id": "hunyuan-2.0-instruct", - "name": "Tencent HY 2.0 Instruct", - "display_name": "Tencent HY 2.0 Instruct", + "id": "microsoft/Phi-4-mini-instruct", + "name": 
"Phi-4-mini-instruct", + "display_name": "Phi-4-mini-instruct", "modalities": { "input": [ "text" @@ -114078,30 +119813,30 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.08, + "output": 0.35 }, "type": "chat" }, { - "id": "hunyuan-t1", - "name": "Hunyuan-T1", - "display_name": "Hunyuan-T1", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "modalities": { "input": [ "text" @@ -114111,8 +119846,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -114132,21 +119867,20 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "hunyuan-turbos", - "name": "Hunyuan-TurboS", - "display_name": "Hunyuan-TurboS", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen3-Coder-480B-A35B-Instruct", + "display_name": "Qwen3-Coder-480B-A35B-Instruct", "modalities": { "input": [ "text" @@ -114156,8 +119890,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -114165,21 +119899,20 @@ "supported": false }, "attachment": 
false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "tc-code-latest", - "name": "Auto", - "display_name": "Auto", + "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -114189,8 +119922,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -114198,21 +119931,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -114222,42 +119953,29 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04-28", + 
"last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "openai/gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -114267,42 +119985,33 @@ ] }, "limit": { - "context": 204800, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "hunyuan-2.0-thinking", - "name": "Tencent HY 2.0 Think", - "display_name": "Tencent HY 2.0 Think", + "id": "openai/gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -114313,46 +120022,35 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": false, - "release_date": "2026-03-08", - "last_updated": "2026-03-08", + "release_date": "2025-08-05", + "last_updated": "2026-03-12", "cost": { - "input": 0, - 
"output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", + "name": "NVIDIA Nemotron 3 Super 120B", + "display_name": "NVIDIA Nemotron 3 Super 120B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -114360,201 +120058,100 @@ }, "limit": { "context": 262144, - "output": 32768 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-03-11", + "last_updated": "2026-03-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.2, + "output": 0.8 }, "type": "chat" - } - ] - }, - "opencode-go": { - "id": "opencode-go", - "name": "OpenCode Go", - "display_name": "OpenCode Go", - "api": "https://opencode.ai/zen/go/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "minimax-m3", - "name": "MiniMax M3", - "display_name": "MiniMax M3", + "id": "OpenPipe/Qwen3-14B-Instruct", + "name": "OpenPipe Qwen3 14B Instruct", + "display_name": "OpenPipe Qwen3 14B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, 
"open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-05-31", - "last_updated": "2026-05-31", + "release_date": "2025-04-29", + "last_updated": "2026-03-12", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.05, + "output": 0.22 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "zai-org/GLM-5-FP8", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image", - "video" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", - "cost": { - "input": 0.2, - "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 - }, - "type": "chat" - }, - { - "id": "mimo-v2-omni", - "name": "MiMo V2 Omni", - "display_name": "MiMo V2 Omni", - "modalities": { - "input": [ - "text", - "image", - "audio", - "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2026-02-11", + "last_updated": "2026-03-12", "cost": { - "input": 0.4, - "output": 2, 
- "cache_read": 0.08 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -114573,22 +120170,22 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26, + "cache_write": 0 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text" @@ -114598,102 +120195,73 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 161000, + "output": 161000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2026-03-12", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 0.55, + "output": 1.65 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], 
"output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 196608, + "output": 196608 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-12", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 0.3, + "output": 1.2 }, "type": "chat" - }, + } + ] + }, + "kuae-cloud-coding-plan": { + "id": "kuae-cloud-coding-plan", + "name": "KUAE Cloud Coding Plan", + "display_name": "KUAE Cloud Coding Plan", + "api": "https://coding-plan-endpoint.kuaecloud.net/v1", + "doc": "https://docs.mthreads.com/kuaecloud/kuaecloud-doc-online/coding_plan/", + "models": [ { - "id": "minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -114725,31 +120293,42 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + 
"gitlab": { + "id": "gitlab", + "name": "GitLab Duo", + "display_name": "GitLab Duo", + "doc": "https://docs.gitlab.com/user/duo_agent_platform/", + "models": [ { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "duo-chat-opus-4-5", + "name": "Agentic Chat (Claude Opus 4.5)", + "display_name": "Agentic Chat (Claude Opus 4.5)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -114757,183 +120336,137 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "duo-chat-opus-4-8", + "name": "Agentic Chat (Claude Opus 4.8)", + "display_name": "Agentic Chat (Claude Opus 4.8)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - 
"attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "duo-chat-opus-4-7", + "name": "Agentic Chat (Claude Opus 4.7)", + "display_name": "Agentic Chat (Claude Opus 4.7)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 65536 + "context": 1000000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "duo-chat-gpt-5-2-codex", + "name": "Agentic Chat (GPT-5.2 Codex)", + "display_name": "Agentic Chat (GPT-5.2 Codex)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "duo-chat-fable-5", + "name": "Agentic Chat (Claude Fable 5)", + "display_name": "Agentic Chat (Claude Fable 5)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" @@ -114941,104 +120474,71 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "release_date": "2026-06-02", - "last_updated": "2026-06-02", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.04, - "cache_write": 0.5, - "tiers": [ - { - "input": 1.2, - "output": 4.8, - "cache_read": 0.12, - "cache_write": 1.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 1.2, - "output": 4.8, - "cache_read": 0.12, - "cache_write": 1.5 - } + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo V2.5", - "display_name": "MiMo V2.5", + "id": 
"duo-chat-gpt-5-5", + "name": "Agentic Chat (GPT-5.5)", + "display_name": "Agentic Chat (GPT-5.5)", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "duo-chat-opus-4-6", + "name": "Agentic Chat (Claude Opus 4.6)", + "display_name": "Agentic Chat (Claude Opus 4.6)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -115046,7 +120546,7 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -115054,178 +120554,126 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.0145 
+ "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "duo-chat-gpt-5-4", + "name": "Agentic Chat (GPT-5.4)", + "display_name": "Agentic Chat (GPT-5.4)", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "duo-chat-gpt-5-codex", + "name": "Agentic Chat (GPT-5 Codex)", + "display_name": "Agentic Chat (GPT-5 Codex)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-07", - "last_updated": "2026-04-07", + "open_weights": false, + "knowledge": "2024-09-30", + 
"release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "duo-chat-gpt-5-4-nano", + "name": "Agentic Chat (GPT-5.4 Nano)", + "display_name": "Agentic Chat (GPT-5.4 Nano)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.0145 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "gitlab": { - "id": "gitlab", - "name": "GitLab Duo", - "display_name": "GitLab Duo", - "doc": "https://docs.gitlab.com/user/duo_agent_platform/", - "models": [ + }, { - "id": "duo-chat-sonnet-4-5", - "name": "Agentic Chat (Claude Sonnet 4.5)", - "display_name": "Agentic Chat (Claude Sonnet 4.5)", + "id": "duo-chat-sonnet-4-6", + "name": "Agentic Chat (Claude Sonnet 4.6)", + "display_name": "Agentic Chat (Claude Sonnet 4.6)", "modalities": { "input": [ "text", @@ -115237,7 +120685,7 @@ ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 64000 }, "temperature": true, @@ -115248,9 +120696,9 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + 
"knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { "input": 0, "output": 0, @@ -115260,21 +120708,20 @@ "type": "chat" }, { - "id": "duo-chat-gpt-5-4", - "name": "Agentic Chat (GPT-5.4)", - "display_name": "Agentic Chat (GPT-5.4)", + "id": "duo-chat-gpt-5-mini", + "name": "Agentic Chat (GPT-5 Mini)", + "display_name": "Agentic Chat (GPT-5 Mini)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -115285,9 +120732,9 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "knowledge": "2024-05-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { "input": 0, "output": 0 @@ -115295,9 +120742,9 @@ "type": "chat" }, { - "id": "duo-chat-gpt-5-2", - "name": "Agentic Chat (GPT-5.2)", - "display_name": "Agentic Chat (GPT-5.2)", + "id": "duo-chat-gpt-5-4-mini", + "name": "Agentic Chat (GPT-5.4 Mini)", + "display_name": "Agentic Chat (GPT-5.4 Mini)", "modalities": { "input": [ "text", @@ -115320,8 +120767,8 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { "input": 0, "output": 0 @@ -115329,9 +120776,9 @@ "type": "chat" }, { - "id": "duo-chat-opus-4-7", - "name": "Agentic Chat (Claude Opus 4.7)", - "display_name": "Agentic Chat (Claude Opus 4.7)", + "id": "duo-chat-gpt-5-3-codex", + "name": "Agentic Chat (GPT-5.3 Codex)", + "display_name": "Agentic Chat (GPT-5.3 Codex)", "modalities": { "input": [ "text", @@ -115343,8 +120790,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -115354,21 +120801,19 @@ }, "attachment": true, 
"open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "duo-chat-opus-4-5", - "name": "Agentic Chat (Claude Opus 4.5)", - "display_name": "Agentic Chat (Claude Opus 4.5)", + "id": "duo-chat-haiku-4-5", + "name": "Agentic Chat (Claude Haiku 4.5)", + "display_name": "Agentic Chat (Claude Haiku 4.5)", "modalities": { "input": [ "text", @@ -115391,7 +120836,7 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", + "knowledge": "2025-02-28", "release_date": "2026-01-08", "last_updated": "2026-01-08", "cost": { @@ -115403,21 +120848,20 @@ "type": "chat" }, { - "id": "duo-chat-opus-4-8", - "name": "Agentic Chat (Claude Opus 4.8)", - "display_name": "Agentic Chat (Claude Opus 4.8)", + "id": "duo-chat-gpt-5-2", + "name": "Agentic Chat (GPT-5.2)", + "display_name": "Agentic Chat (GPT-5.2)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -115428,35 +120872,34 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2025-08-31", + "release_date": "2026-01-23", + "last_updated": "2026-01-23", "cost": { "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "output": 0 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-4-nano", - "name": "Agentic Chat (GPT-5.4 Nano)", - "display_name": "Agentic Chat (GPT-5.4 Nano)", + "id": "duo-chat-sonnet-4-5", + "name": "Agentic Chat (Claude Sonnet 4.5)", + "display_name": "Agentic Chat (Claude Sonnet 4.5)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, 
"limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -115464,19 +120907,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-07-31", + "release_date": "2026-01-08", + "last_updated": "2026-01-08", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-4-mini", - "name": "Agentic Chat (GPT-5.4 Mini)", - "display_name": "Agentic Chat (GPT-5.4 Mini)", + "id": "duo-chat-gpt-5-1", + "name": "Agentic Chat (GPT-5.1)", + "display_name": "Agentic Chat (GPT-5.1)", "modalities": { "input": [ "text", @@ -115498,66 +120943,71 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2026-01-22", + "last_updated": "2026-01-22", "cost": { "input": 0, "output": 0 }, "type": "chat" - }, + } + ] + }, + "kilo": { + "id": "kilo", + "name": "Kilo Gateway", + "display_name": "Kilo Gateway", + "api": "https://api.kilo.ai/api/gateway", + "doc": "https://kilo.ai", + "models": [ { - "id": "duo-chat-gpt-5-mini", - "name": "Agentic Chat (GPT-5 Mini)", - "display_name": "Agentic Chat (GPT-5 Mini)", + "id": "inclusionai/ling-2.6-1t", + "name": "inclusionAI: Ling-2.6-1T", + "display_name": "inclusionAI: Ling-2.6-1T", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - 
"release_date": "2026-01-22", - "last_updated": "2026-01-22", + "release_date": "2026-04-23", + "last_updated": "2026-05-16", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "duo-chat-opus-4-6", - "name": "Agentic Chat (Claude Opus 4.6)", - "display_name": "Agentic Chat (Claude Opus 4.6)", + "id": "inclusionai/ring-2.6-1t", + "name": "inclusionAI: Ring-2.6-1T", + "display_name": "inclusionAI: Ring-2.6-1T", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -115565,279 +121015,240 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-05-08", + "last_updated": "2026-05-16", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.075, + "output": 0.625, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-5", - "name": "Agentic Chat (GPT-5.5)", - "display_name": "Agentic Chat (GPT-5.5)", + "id": "inclusionai/ling-2.6-flash", + "name": "inclusionAI: Ling-2.6 Flash", + "display_name": "inclusionAI: Ling-2.6 Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 0, - "output": 0 + 
"input": 0.08, + "output": 0.24, + "cache_read": 0.016 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-1", - "name": "Agentic Chat (GPT-5.1)", - "display_name": "Agentic Chat (GPT-5.1)", + "id": "ibm-granite/granite-4.0-h-micro", + "name": "IBM: Granite 4.0 Micro", + "display_name": "IBM: Granite 4.0 Micro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-20", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0 + "input": 0.017, + "output": 0.11 }, "type": "chat" }, { - "id": "duo-chat-haiku-4-5", - "name": "Agentic Chat (Claude Haiku 4.5)", - "display_name": "Agentic Chat (Claude Haiku 4.5)", + "id": "ibm-granite/granite-4.1-8b", + "name": "IBM: Granite 4.1 8B", + "display_name": "IBM: Granite 4.1 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2026-01-08", - "last_updated": "2026-01-08", + "release_date": "2026-04-30", + "last_updated": "2026-05-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.05, + "output": 0.1, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-2-codex", - "name": "Agentic Chat (GPT-5.2 Codex)", 
- "display_name": "Agentic Chat (GPT-5.2 Codex)", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Meta: Llama 3.1 8B Instruct", + "display_name": "Meta: Llama 3.1 8B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2025-12-23", "cost": { - "input": 0, - "output": 0 + "input": 0.02, + "output": 0.05 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-3-codex", - "name": "Agentic Chat (GPT-5.3 Codex)", - "display_name": "Agentic Chat (GPT-5.3 Codex)", + "id": "meta-llama/llama-3-70b-instruct", + "name": "Meta: Llama 3 70B Instruct", + "display_name": "Meta: Llama 3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0 + "input": 0.51, + "output": 0.74 }, "type": "chat" }, { - "id": "duo-chat-sonnet-4-6", - "name": "Agentic Chat (Claude Sonnet 4.6)", - "display_name": "Agentic Chat (Claude Sonnet 4.6)", + "id": "meta-llama/llama-3.1-70b-instruct", + "name": 
"Meta: Llama 3.1 70B Instruct", + "display_name": "Meta: Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-16", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "duo-chat-gpt-5-codex", - "name": "Agentic Chat (GPT-5 Codex)", - "display_name": "Agentic Chat (GPT-5 Codex)", + "id": "meta-llama/llama-3.2-1b-instruct", + "name": "Meta: Llama 3.2 1B Instruct", + "display_name": "Meta: Llama 3.2 1B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 60000, + "output": 12000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-22", - "last_updated": "2026-01-22", + "open_weights": true, + "release_date": "2024-09-18", + "last_updated": "2026-01-27", "cost": { - "input": 0, - "output": 0 + "input": 0.027, + "output": 0.2 }, "type": "chat" - } - ] - }, - "cortecs": { - "id": "cortecs", - "name": "Cortecs", - "display_name": "Cortecs", - "api": "https://api.cortecs.ai/v1", - "doc": "https://api.cortecs.ai/v1/models", - "models": [ + }, { - "id": "nova-pro-v1", - "name": "Nova Pro 1.0", - "display_name": "Nova Pro 1.0", + "id": 
"meta-llama/llama-4-maverick", + "name": "Meta: Llama 4 Maverick", + "display_name": "Meta: Llama 4 Maverick", "modalities": { "input": [ "text", @@ -115848,85 +121259,60 @@ ] }, "limit": { - "context": 300000, - "output": 5000 + "context": 1048576, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-12-24", "cost": { - "input": 1.016, - "output": 4.061 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "meta-llama/llama-3.2-11b-vision-instruct", + "name": "Meta: Llama 3.2 11B Vision Instruct", + "display_name": "Meta: Llama 3.2 11B Vision Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": true, + "open_weights": true, + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 3.307, - "output": 16.536 + "input": 0.049, + "output": 0.049 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek R1 0528", - "display_name": "DeepSeek R1 0528", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Meta: Llama 3.3 70B Instruct", + "display_name": "Meta: Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -115936,41 +121322,28 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2024-08-01", + "last_updated": "2026-02-04", "cost": { - "input": 0.585, - "output": 2.307 + "input": 0.1, + "output": 0.32 }, "type": "chat" }, { - "id": "qwen3.5-122b-a10b", - "name": "Qwen3.5 122B A10B", - "display_name": "Qwen3.5 122B A10B", + "id": "meta-llama/llama-guard-3-8b", + "name": "Llama Guard 3 8B", + "display_name": "Llama Guard 3 8B", "modalities": { "input": [ "text" @@ -115980,43 +121353,31 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 26215 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": 
"summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2024-04-18", + "last_updated": "2026-02-04", "cost": { - "input": 0.444, - "output": 3.106 + "input": 0.02, + "output": 0.06 }, "type": "chat" }, { - "id": "llama-3.1-405b-instruct", - "name": "Llama 3.1 405B Instruct", - "display_name": "Llama 3.1 405B Instruct", + "id": "meta-llama/llama-guard-4-12b", + "name": "Meta: Llama Guard 4 12B", + "display_name": "Meta: Llama Guard 4 12B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -116024,8 +121385,39 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.18, + "output": 0.18 + }, + "type": "chat" + }, + { + "id": "meta-llama/llama-3-8b-instruct", + "name": "Meta: Llama 3 8B Instruct", + "display_name": "Meta: Llama 3 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -116034,62 +121426,81 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2024-04-25", + "last_updated": "2025-04-03", "cost": { - "input": 0, - "output": 0 + "input": 0.03, + "output": 0.04 }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "meta-llama/llama-4-scout", + "name": "Meta: Llama 4 Scout", + "display_name": "Meta: Llama 4 Scout", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 
16384, + "context": 327680, "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": true, + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.08, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Meta: Llama 3.2 3B Instruct", + "display_name": "Meta: Llama 3.2 3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 80000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "release_date": "2024-09-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.099, - "output": 0.33 + "input": 0.051, + "output": 0.34 }, "type": "chat" }, { - "id": "hermes-4-70b", - "name": "Hermes 4 70B", - "display_name": "Hermes 4 70B", + "id": "kilo-auto/balanced", + "name": "Kilo Auto Balanced", + "display_name": "Kilo Auto Balanced", "modalities": { "input": [ "text" @@ -116099,8 +121510,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -116109,22 +121520,22 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.116, - "output": 0.358 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek V3 0324", - "display_name": 
"DeepSeek V3 0324", + "id": "kilo-auto/small", + "name": "Kilo Auto Small", + "display_name": "Kilo Auto Small", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -116132,29 +121543,29 @@ ] }, "limit": { - "context": 128000, + "context": 400000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.551, - "output": 1.654 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "kilo-auto/free", + "name": "Kilo Auto Free", + "display_name": "Kilo Auto Free", "modalities": { "input": [ "text" @@ -116164,8 +121575,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -116174,22 +121585,22 @@ "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.053, - "output": 0.222 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "kilo-auto/frontier", + "name": "Kilo Auto Frontier", + "display_name": "Kilo Auto Frontier", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -116197,8 +121608,8 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -116206,44 +121617,31 @@ 
"supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.656, - "output": 2.731 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "devstral-small-2512", - "name": "Devstral Small 2 2512", - "display_name": "Devstral Small 2 2512", + "id": "moonshotai/kimi-k2", + "name": "MoonshotAI: Kimi K2 0711", + "display_name": "MoonshotAI: Kimi K2 0711", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131000, + "output": 26215 }, "temperature": true, "tool_call": true, @@ -116252,77 +121650,65 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2025-07-11", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "moonshotai/kimi-k2-thinking", + "name": "MoonshotAI: Kimi K2 Thinking", + "display_name": "MoonshotAI: Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, 
"interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 1.09, - "output": 5.43 + "input": 0.47, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "moonshotai/kimi-k2.5", + "name": "MoonshotAI: Kimi K2.5", + "display_name": "MoonshotAI: Kimi K2.5", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -116330,8 +121716,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 262144, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -116341,82 +121727,197 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-01-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.266, - "output": 0.444 + "input": 0.45, + "output": 2.2 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "moonshotai/kimi-k2.6", + "name": "MoonshotAI: Kimi K2.6", + "display_name": "MoonshotAI: Kimi K2.6", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 
262144, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-04-20", + "last_updated": "2026-05-12", + "cost": { + "input": 0.75, + "output": 3.5, + "cache_read": 0.375 + }, + "type": "chat" + }, + { + "id": "moonshotai/kimi-k2-0905", + "name": "MoonshotAI: Kimi K2 0905", + "display_name": "MoonshotAI: Kimi K2 0905", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 26215 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.4, + "output": 2, + "cache_read": 0.15 + }, + "type": "chat" + }, + { + "id": "baidu/ernie-4.5-300b-a47b", + "name": "Baidu: ERNIE 4.5 300B A47B ", + "display_name": "Baidu: ERNIE 4.5 300B A47B ", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 123000, + "output": 12000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", + "cost": { + "input": 0.28, + "output": 1.1 + }, + "type": "chat" + }, + { + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "Baidu: ERNIE 4.5 VL 28B A3B", + 
"display_name": "Baidu: ERNIE 4.5 VL 28B A3B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 30000, + "output": 8000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2025-06-30", + "cost": { + "input": 0.14, + "output": 0.56 + }, + "type": "chat" + }, + { + "id": "baidu/ernie-4.5-vl-424b-a47b", + "name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "display_name": "Baidu: ERNIE 4.5 VL 424B A47B ", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 123000, + "output": 16000 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": true, + "release_date": "2025-06-30", + "last_updated": "2026-01", "cost": { - "input": 3, - "output": 16.13, - "cache_read": 0.25 + "input": 0.42, + "output": 1.25 }, "type": "chat" }, { - "id": "kimi-k2-instruct", - "name": "Kimi K2 Instruct", - "display_name": "Kimi K2 Instruct", + "id": "baidu/ernie-4.5-21b-a3b-thinking", + "name": "Baidu: ERNIE 4.5 21B A3B Thinking", + "display_name": "Baidu: ERNIE 4.5 21B A3B Thinking", "modalities": { "input": [ "text" @@ -116426,29 +121927,29 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 131072, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-07-11", - "last_updated": "2025-09-05", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.551, - "output": 2.646 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "minimax-m2.1", - "name": "MiniMax-M2.1", - 
"display_name": "MiniMax-M2.1", + "id": "baidu/cobuddy:free", + "name": "Baidu: CoBuddy (free)", + "display_name": "Baidu: CoBuddy (free)", "modalities": { "input": [ "text" @@ -116458,40 +121959,29 @@ ] }, "limit": { - "context": 196000, - "output": 196000 + "context": 131072, + "output": 65536 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-05-06", + "last_updated": "2026-05-07", "cost": { - "input": 0.34, - "output": 1.34 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "intellect-3", - "name": "INTELLECT 3", - "display_name": "INTELLECT 3", + "id": "baidu/ernie-4.5-21b-a3b", + "name": "Baidu: ERNIE 4.5 21B A3B", + "display_name": "Baidu: ERNIE 4.5 21B A3B", "modalities": { "input": [ "text" @@ -116501,109 +121991,95 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 120000, + "output": 8000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-26", - "last_updated": "2025-11-26", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.219, - "output": 1.202 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "baidu/qianfan-ocr-fast", + "name": "Baidu: Qianfan-OCR-Fast", + "display_name": "Baidu: Qianfan-OCR-Fast", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 256000, - "output": 256000 + "context": 65536, + "output": 28672 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-05-16", "cost": { - "input": 0.81, - "output": 3.54, - "cache_read": 0.2 + "input": 0.68, + "output": 2.81 }, "type": "chat" }, { - "id": "mistral-large-2512", - "name": "Mistral Large 3 2512", - "display_name": "Mistral Large 3 2512", + "id": "perceptron/perceptron-mk1", + "name": "Perceptron: Perceptron Mk1", + "display_name": "Perceptron: Perceptron Mk1", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-16", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0.05 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "alfredpros/codellama-7b-instruct-solidity", + "name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", + "display_name": "AlfredPros: CodeLLaMa 7B Instruct Solidity", "modalities": { "input": [ "text" @@ -116613,78 +122089,72 @@ ] }, "limit": { - "context": 198000, - "output": 198000 + 
"context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.45, - "output": 2.23 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT Oss 120b", - "display_name": "GPT Oss 120b", + "id": "google/gemini-3.1-flash-lite", + "name": "Google: Gemini 3.1 Flash Lite", + "display_name": "Google: Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-01", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-07", + "last_updated": "2026-05-16", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 1.5, + "reasoning": 1.5, + "cache_read": 0.025, + "cache_write": 0.08333 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next 80B", - "display_name": "Qwen3 Coder Next 80B", + "id": "google/gemma-3n-e4b-it", + "name": "Google: Gemma 3n 4B", + "display_name": "Google: Gemma 3n 4B", "modalities": { "input": [ "text" @@ -116694,34 +122164,35 @@ ] }, "limit": { - "context": 256000, - 
"output": 65536 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.158, - "output": 0.84 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "google/gemini-2.5-pro", + "name": "Google: Gemini 2.5 Pro", + "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" @@ -116729,7 +122200,7 @@ }, "limit": { "context": 1048576, - "output": 65535 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -116756,255 +122227,283 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", "release_date": "2025-03-20", - "last_updated": "2025-06-17", + "last_updated": "2026-03-15", "cost": { - "input": 1.654, - "output": 11.024 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT 4.1", - "display_name": "GPT 4.1", + "id": "google/gemini-2.5-flash", + "name": "Google: Gemini 2.5 Flash", + "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ + "audio", + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": 
{ + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-07-17", + "last_updated": "2026-03-15", "cost": { - "input": 2.354, - "output": 9.417 + "input": 0.3, + "output": 2.5, + "reasoning": 2.5, + "cache_read": 0.03, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "google/gemini-3.5-flash", + "name": "Google: Gemini 3.5 Flash", + "display_name": "Google: Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-19", + "last_updated": "2026-05-27", "cost": { - "input": 0.441, - "output": 1.984 + "input": 1.5, + "output": 9, + "reasoning": 9, + "cache_read": 0.15, + "cache_write": 0.08333 }, "type": "chat" }, { - "id": "claude-opus4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": 
"google/gemini-2.0-flash-lite-001", + "name": "Google: Gemini 2.0 Flash Lite", + "display_name": "Google: Gemini 2.0 Flash Lite", "modalities": { "input": [ - "text", + "audio", "image", - "pdf" + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2024-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 5.98, - "output": 29.89 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "google/gemini-2.5-flash-lite-preview-09-2025", + "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", + "display_name": "Google: Gemini 2.5 Flash Lite Preview 09-2025", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-11", - "last_updated": "2025-09-11", - "cost": { - "input": 0.164, - "output": 1.311 - }, - "type": "chat" - }, - { - "id": "mixtral-8x7B-instruct-v0.1", - 
"name": "Mixtral 8x7B Instruct v0.1", - "display_name": "Mixtral 8x7B Instruct v0.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 32000, - "output": 32000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-12-11", - "last_updated": "2023-12-11", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.438, - "output": 0.68 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "google/gemini-2.0-flash-001", + "name": "Google: Gemini 2.0 Flash", + "display_name": "Google: Gemini 2.0 Flash", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 203000, - "output": 203000 + "context": 1048576, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-08", - "last_updated": "2025-08-08", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.09, - "output": 0.53 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "claude-opus4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "google/gemma-4-31b-it", + "name": 
"Google: Gemma 4 31B", + "display_name": "Google: Gemma 4 31B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -117013,66 +122512,59 @@ "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-11", "cost": { - "input": 5.98, - "output": 29.89 + "input": 0.14, + "output": 0.4 }, "type": "chat" }, { - "id": "minimax-m2.7", - "name": "MiniMax-m2.7", - "display_name": "MiniMax-m2.7", + "id": "google/lyria-3-clip-preview", + "name": "Google: Lyria 3 Clip Preview", + "display_name": "Google: Lyria 3 Clip Preview", "modalities": { "input": [ + "image", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 202752, - "output": 196072 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-04-11", "cost": { - "input": 0.47, - "output": 1.4 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Google: Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Google: Gemini 3.1 Pro Preview Custom Tools", 
"modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" @@ -117080,7 +122572,7 @@ }, "limit": { "context": 1048576, - "output": 384000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -117091,44 +122583,51 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.133, - "output": 0.266, - "cache_read": 0.0028 + "input": 2, + "output": 12, + "reasoning": 12 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "google/gemini-3-pro-image-preview", + "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", + "display_name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 65536, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -117136,150 +122635,180 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + 
"release_date": "2025-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 1.08, - "output": 3.44 + "input": 2, + "output": 12, + "reasoning": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "devstral-2512", - "name": "Devstral 2 2512", - "display_name": "Devstral 2 2512", + "id": "google/gemini-2.5-flash-image", + "name": "Google: Nano Banana (Gemini 2.5 Flash Image)", + "display_name": "Google: Nano Banana (Gemini 2.5 Flash Image)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "attachment": true, + "open_weights": false, + "release_date": "2025-10-08", + "last_updated": "2026-03-15", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 2.5 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "google/gemini-2.5-flash-lite", + "name": "Google: Gemini 2.5 Flash Lite", + "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - 
"open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.67, - "output": 2.46 + "input": 0.1, + "output": 0.4, + "reasoning": 0.4, + "cache_read": 0.01, + "cache_write": 0.083333 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", + "display_name": "Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)", "modalities": { "input": [ + "image", "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.062, - "output": 0.408 + "input": 0.5, + "output": 3 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "claude-4-6-sonnet", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "google/gemini-2.5-pro-preview-05-06", + "name": "Google: Gemini 2.5 Pro Preview 05-06", + "display_name": "Google: Gemini 2.5 Pro Preview 05-06", "modalities": { "input": [ - "text", + "audio", "image", - "pdf" + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 1048576, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -117287,32 +122816,57 @@ 
"supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 3.59, - "output": 17.92 + "input": 1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "google/gemini-3.1-pro-preview", + "name": "Google: Gemini 3.1 Pro Preview", + "display_name": "Google: Gemini 3.1 Pro Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 250000, - "output": 250000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -117323,68 +122877,74 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-19", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3.6 + "input": 2, + "output": 12, + "reasoning": 12 }, "type": "chat" }, { - "id": "claude-opus4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": 
"google/gemma-4-26b-a4b-it", + "name": "Google: Gemma 4 26B A4B", + "display_name": "Google: Gemma 4 26B A4B", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": true, + "release_date": "2026-04-03", + "last_updated": "2026-04-11", "cost": { - "input": 5.6, - "output": 27.99, - "cache_read": 0.56, - "cache_write": 6.99 + "input": 0.12, + "output": 0.4 }, "type": "chat" }, { - "id": "codestral-2508", - "name": "Codestral 2508", - "display_name": "Codestral 2508", + "id": "google/gemini-2.5-pro-preview", + "name": "Google: Gemini 2.5 Pro Preview 06-05", + "display_name": "Google: Gemini 2.5 Pro Preview 06-05", "modalities": { "input": [ + "audio", + "image", + "pdf", "text" ], "output": [ @@ -117392,41 +122952,66 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-07-30", - "last_updated": "2025-07-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.03 + "input": 
1.25, + "output": 10, + "reasoning": 10, + "cache_read": 0.125, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "google/gemini-3-flash-preview", + "name": "Google: Gemini 3 Flash Preview", + "display_name": "Google: Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 400000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -117437,31 +123022,75 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, + "open_weights": false, + "release_date": "2025-12-17", + "last_updated": "2026-03-15", + "cost": { + "input": 0.5, + "output": 3, + "reasoning": 3, + "cache_read": 0.05, + "cache_write": 0.083333 + }, + "type": "chat" + }, + { + "id": "google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "display_name": "Google: Gemma 3 12B", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-03-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.39, - "output": 1.57 + "input": 0.04, + "output": 0.13, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "google/gemma-3-4b-it", + "name": "Google: 
Gemma 3 4B", + "display_name": "Google: Gemma 3 4B", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -117469,108 +123098,94 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 131072, + "output": 19200 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-03-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.32, - "output": 1.18 + "input": 0.04, + "output": 0.08 }, "type": "chat" }, { - "id": "claude-4-5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "google/gemma-3-27b-it", + "name": "Google: Gemma 3 27B", + "display_name": "Google: Gemma 3 27B", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 128000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 3.259, - "output": 16.296 + "input": 0.03, + "output": 0.11, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B A12B", - "display_name": "Nemotron 3 Super 120B A12B", + "id": "google/lyria-3-pro-preview", + "name": "Google: Lyria 3 Pro Preview", + "display_name": "Google: Lyria 3 Pro Preview", "modalities": { 
"input": [ + "image", "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-30", + "last_updated": "2026-04-11", "cost": { - "input": 0.266, - "output": 0.799 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "google/gemma-2-27b-it", + "name": "Google: Gemma 2 27B", + "display_name": "Google: Gemma 2 27B", "modalities": { "input": [ "text" @@ -117580,33 +123195,35 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2024-06-24", + "last_updated": "2024-06-24", "cost": { - "input": 0.089, - "output": 0.275 + "input": 0.65, + "output": 0.65 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "google/gemini-3.1-flash-lite-preview", + "name": "Google: Gemini 3.1 Flash Lite Preview", + "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ "text" @@ -117614,7 +123231,7 @@ }, "limit": { "context": 1048576, - "output": 384000 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -117624,79 +123241,59 @@ }, 
"extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-15", "cost": { - "input": 1.553, - "output": 3.106, - "cache_read": 0.003625 + "input": 0.25, + "output": 1.5, + "reasoning": 1.5 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "liquid/lfm-2-24b-a2b", + "name": "LiquidAI: LFM2-24B-A2B", + "display_name": "LiquidAI: LFM2-24B-A2B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.55, - "output": 2.76 + "input": 0.03, + "output": 0.12 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "x-ai/grok-4.20", + "name": "xAI: Grok 4.20", + "display_name": "xAI: Grok 4.20", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -117704,8 +123301,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 2000000, + "output": 2000000 }, "temperature": true, "tool_call": 
true, @@ -117713,32 +123310,34 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-01", - "last_updated": "2025-08-01", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", "cost": { - "input": 0.22, - "output": 1.34 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "x-ai/grok-4.3", + "name": "xAI: Grok 4.3", + "display_name": "xAI: Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -117748,32 +123347,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 1.31, - "output": 4.1, - "cache_read": 0.24 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen-2.5-72b-instruct", - "name": "Qwen2.5 72B Instruct", - "display_name": "Qwen2.5 72B Instruct", + "id": "x-ai/grok-4.20-multi-agent", + "name": "xAI: Grok 4.20 Multi-Agent", + "display_name": "xAI: Grok 4.20 Multi-Agent", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -117781,40 +123376,33 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 2000000, + "output": 2000000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, - "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "attachment": true, + "open_weights": false, + "release_date": "2026-03-31", + "last_updated": "2026-04-11", "cost": { - "input": 0.062, - "output": 0.231 + "input": 2, + "output": 6, + "cache_read": 0.2 }, "type": "chat" - } - ] - }, - "auriko": { - "id": "auriko", - "name": "Auriko", - "display_name": "Auriko", - "api": "https://api.auriko.ai/v1", - "doc": "https://docs.auriko.ai", - "models": [ + }, { - "id": "minimax-m2-7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "x-ai/grok-build-0.1", + "name": "xAI: Grok Build 0.1", + "display_name": "xAI: Grok Build 0.1", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -117822,8 +123410,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -117831,86 +123419,58 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-20", + "last_updated": "2026-05-27", "cost": { - "input": 0.3, - "output": 1.2, - "cache_write": 0.375 + "input": 1, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "microsoft/phi-4-mini-instruct", + "name": "Microsoft: Phi 4 Mini Instruct", + "display_name": "Microsoft: Phi 4 Mini Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - 
}, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-17", + "last_updated": "2026-05-07", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.08, + "output": 0.35, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "minimax-m2-7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "microsoft/phi-4", + "name": "Microsoft: Phi 4", + "display_name": "Microsoft: Phi 4", "modalities": { "input": [ "text" @@ -117920,92 +123480,70 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.6, - "output": 2.4, - "cache_write": 0.375 + "input": 0.06, + "output": 0.14 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + 
"display_name": "WizardLM-2 8x22B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 65535, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2024-04-24", + "last_updated": "2024-04-24", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.62, + "output": 0.62 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "poolside/laguna-xs.2:free", + "name": "Poolside: Laguna XS.2 (free)", + "display_name": "Poolside: Laguna XS.2 (free)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118013,70 +123551,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", "cost": { - "input": 1.25, - "output": 
10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "poolside/laguna-m.1:free", + "name": "Poolside: Laguna M.1 (free)", + "display_name": "Poolside: Laguna M.1 (free)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -118084,128 +123583,62 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2026-04-28", + "last_updated": "2026-05-01", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "writer/palmyra-x5", + "name": "Writer: Palmyra X5", + "display_name": "Writer: Palmyra X5", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1040000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.6, + "output": 6 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "z-ai/glm-4.7", + "name": "Z.ai: GLM 4.7", + "display_name": "Z.ai: GLM 4.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, @@ -118216,52 +123649,41 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03 + "input": 0.38, + "output": 1.98, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen-3.6-plus", - 
"name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "z-ai/glm-4.5v", + "name": "Z.ai: GLM 4.5V", + "display_name": "Z.ai: GLM 4.5V", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -118269,40 +123691,21 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": true, + "open_weights": true, + "release_date": "2025-08-11", + "last_updated": "2025-08-11", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1, - "tiers": [ - { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 2, - "output": 6, - "cache_read": 0.2, - "cache_write": 2.5 - } + "input": 0.6, + "output": 1.8, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "z-ai/glm-4.5", + "name": "Z.ai: GLM 4.5", + "display_name": "Z.ai: GLM 4.5", "modalities": { "input": [ "text" @@ -118312,8 +123715,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -118321,98 +123724,58 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-07-28", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.6, + 
"output": 2.2, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "z-ai/glm-5.1", + "name": "Z.ai: GLM 5.1", + "display_name": "Z.ai: GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.26, + "output": 3.96 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "z-ai/glm-4.6", + "name": "Z.ai: GLM 4.6", + "display_name": "Z.ai: GLM 4.6", "modalities": { "input": [ "text" @@ -118422,8 +123785,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, @@ -118433,150 +123796,101 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-09-30", + "last_updated": "2026-03-15", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.39, + "output": 1.9, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "z-ai/glm-4-32b", + "name": "Z.ai: GLM 4 32B ", + "display_name": "Z.ai: GLM 4 32B ", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2.8 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "z-ai/glm-4.6v", + "name": "Z.ai: GLM 4.6V", + "display_name": "Z.ai: GLM 4.6V", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": true, + "release_date": "2025-09-30", + "last_updated": "2026-01-10", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "z-ai/glm-5v-turbo", + "name": "Z.ai: GLM 5V Turbo", + "display_name": "Z.ai: GLM 5V Turbo", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 202752, "output": 131072 }, "temperature": true, @@ -118585,44 +123899,23 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" - } - ] - }, - "berget": { - "id": "berget", - "name": "Berget.AI", - "display_name": "Berget.AI", - "api": "https://api.berget.ai/v1", - "doc": "https://api.berget.ai", - "models": [ + }, { - "id": "mistralai/Mistral-Medium-3.5-128B", - "name": "Mistral Medium 3.5 128B", - "display_name": "Mistral Medium 3.5 128B", + "id": "z-ai/glm-4.5-air", + "name": "Z.ai: GLM 4.5 Air", + "display_name": "Z.ai: GLM 4.5 Air", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -118630,8 +123923,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, @@ -118639,21 +123932,21 
@@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2026-04", - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 1.65, - "output": 5.5 + "input": 0.13, + "output": 0.85, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct 2506", - "display_name": "Mistral Small 3.2 24B Instruct 2506", + "id": "z-ai/glm-4.7-flash", + "name": "Z.ai: GLM 4.7 Flash", + "display_name": "Z.ai: GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -118663,8 +123956,8 @@ ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 202752, + "output": 40551 }, "temperature": true, "tool_call": true, @@ -118672,21 +123965,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.33, - "output": 0.33 + "input": 0.06, + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "z-ai/glm-5", + "name": "Z.ai: GLM 5", + "display_name": "Z.ai: GLM 5", "modalities": { "input": [ "text" @@ -118696,8 +123994,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118718,32 +124016,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.77, - "output": 2.75 + "input": 0.72, + "output": 2.3 }, "type": "chat" }, { - "id": 
"moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "z-ai/glm-5-turbo", + "name": "Z.ai: GLM 5 Turbo", + "display_name": "Z.ai: GLM 5 Turbo", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -118753,33 +124048,28 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "release_date": "2026-03-15", + "last_updated": "2026-04-11", "cost": { - "input": 0.83, - "output": 3.85, - "cache_read": 0.16 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "openai/gpt-4o-mini-2024-07-18", + "name": "OpenAI: GPT-4o-mini (2024-07-18)", + "display_name": "OpenAI: GPT-4o-mini (2024-07-18)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -118788,43 +124078,38 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-27", - "last_updated": "2025-04-27", + "attachment": true, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.99, - "output": 0.99 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B Instruct", - "display_name": "Gemma 4 31B 
Instruct", + "id": "openai/gpt-oss-safeguard-20b", + "name": "OpenAI: gpt-oss-safeguard-20b", + "display_name": "OpenAI: gpt-oss-safeguard-20b", "modalities": { "input": [ - "audio", - "image", - "text", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -118832,21 +124117,21 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "attachment": false, + "open_weights": false, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.275, - "output": 0.55 + "input": 0.075, + "output": 0.3, + "cache_read": 0.037 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS-120B", - "display_name": "GPT-OSS-120B", + "id": "openai/gpt-3.5-turbo-instruct", + "name": "OpenAI: GPT-3.5 Turbo Instruct", + "display_name": "OpenAI: GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -118856,112 +124141,67 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 4095, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2023-03-01", + "last_updated": "2023-09-21", "cost": { - "input": 0.44, - "output": 0.99 + "input": 1.5, + "output": 2 }, "type": "chat" - } - ] - }, - "cloudflare-ai-gateway": { - "id": "cloudflare-ai-gateway", - "name": "Cloudflare AI Gateway", - "display_name": "Cloudflare AI Gateway", - "doc": "https://developers.cloudflare.com/ai-gateway/", - "models": [ + }, { - "id": 
"anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5 (latest)", - "display_name": "Claude Opus 4.5 (latest)", + "id": "openai/gpt-5.2-chat", + "name": "OpenAI: GPT-5.2 Chat", + "display_name": "OpenAI: GPT-5.2 Chat", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4 (latest)", - "display_name": "Claude Sonnet 4 (latest)", + "id": "openai/o3", + "name": "OpenAI: o3", + "display_name": "OpenAI: o3", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" @@ -118969,371 +124209,308 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "openai/o4-mini-high", + "name": "OpenAI: o4 Mini High", + "display_name": "OpenAI: o4 Mini High", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-04-17", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "anthropic/claude-3-sonnet", - "name": "Claude Sonnet 3", - "display_name": "Claude Sonnet 3", + "id": "openai/gpt-audio", + "name": "OpenAI: GPT Audio", + "display_name": "OpenAI: GPT Audio", "modalities": { "input": [ - "text", - "image", - "pdf" + "audio", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-04", - "last_updated": "2024-03-04", + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 0.3 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "openai/gpt-5.2-pro", + "name": "OpenAI: GPT-5.2 Pro", + "display_name": "OpenAI: GPT-5.2 Pro", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { 
"supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1 (latest)", - "display_name": "Claude Opus 4.1 (latest)", + "id": "openai/gpt-4o-mini-search-preview", + "name": "OpenAI: GPT-4o-mini Search Preview", + "display_name": "OpenAI: GPT-4o-mini Search Preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - 
"notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "openai/gpt-5", + "name": "OpenAI: GPT-5", + "display_name": "OpenAI: GPT-5", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-sonnet", - "name": "Claude Sonnet 3.5 v2", - "display_name": "Claude Sonnet 3.5 v2", + "id": "openai/gpt-5-chat", + "name": "OpenAI: GPT-5 Chat", + 
"display_name": "OpenAI: GPT-5 Chat", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04-30", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "openai/gpt-3.5-turbo", + "name": "OpenAI: GPT-3.5 Turbo", + "display_name": "OpenAI: GPT-3.5 Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 16385, "output": 4096 }, "temperature": true, @@ -119341,35 +124518,32 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "release_date": "2023-03-01", + "last_updated": "2023-11-06", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "anthropic/claude-fable-5", - "name": "Claude Fable 5", - "display_name": "Claude Fable 5", + "id": "openai/gpt-5-pro", + "name": "OpenAI: GPT-5 Pro", + "display_name": "OpenAI: GPT-5 Pro", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -119382,58 +124556,44 @@ "reasoning": { "supported": true, 
"default_enabled": true, - "mode": "effort", + "mode": "fixed", "effort": "high", - "effort_options": [ + "verbosity": "medium", + "verbosity_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "release_date": "2025-10-06", + "last_updated": "2026-03-15", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "anthropic/claude-3-5-haiku", - "name": "Claude Haiku 3.5 (latest)", - "display_name": "Claude Haiku 3.5 (latest)", + "id": "openai/gpt-4o", + "name": "OpenAI: GPT-4o", + "display_name": "OpenAI: GPT-4o", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -119442,33 +124602,29 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "anthropic/claude-3-opus", - "name": "Claude Opus 3", - "display_name": "Claude Opus 3", + "id": "openai/gpt-4", + "name": "OpenAI: 
GPT-4", + "display_name": "OpenAI: GPT-4", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 8191, "output": 4096 }, "temperature": true, @@ -119476,238 +124632,258 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-02-29", - "last_updated": "2024-02-29", + "release_date": "2023-03-14", + "last_updated": "2024-04-09", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "openai/o4-mini", + "name": "OpenAI: o4 Mini", + "display_name": "OpenAI: o4 Mini", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2025-04-16", + "last_updated": "2026-03-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "openai/gpt-3.5-turbo-16k", + "name": "OpenAI: GPT-3.5 Turbo 16k", + "display_name": "OpenAI: GPT-3.5 Turbo 16k", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 16385, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2023-08-28", + "last_updated": "2026-03-15", "cost": { "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "output": 4 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6 (latest)", - "display_name": "Claude Opus 4.6 (latest)", + "id": "openai/o3-pro", + "name": "OpenAI: o3 Pro", + "display_name": "OpenAI: o3 Pro", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-04-16", + "last_updated": "2026-03-15", + "cost": { + "input": 20, + "output": 80 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.1-chat", + "name": "OpenAI: GPT-5.1 Chat", + "display_name": "OpenAI: GPT-5.1 Chat", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2026-03-15", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-2024-05-13", + "name": "OpenAI: GPT-4o (2024-05-13)", + "display_name": "OpenAI: GPT-4o (2024-05-13)", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2026-03-15", "cost": { "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5, - "tier": { - "type": "context", - "size": 200000 - } - } + "output": 15 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4-0314", + "name": "OpenAI: GPT-4 (older v0314)", + "display_name": "OpenAI: GPT-4 (older v0314)", + "modalities": { + "input": [ + "text" ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 4096 + }, + "temperature": true, + 
"tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2023-05-28", + "last_updated": "2026-03-15", + "cost": { + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "openai/gpt-5.4-nano", + "name": "OpenAI: GPT-5.4 Nano", + "display_name": "OpenAI: GPT-5.4 Nano", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -119721,136 +124897,136 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", - "xhigh", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", + "cost": { + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.3-chat", + "name": "OpenAI: GPT-5.3 Chat", + "display_name": "OpenAI: GPT-5.3 Chat", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-04", + "last_updated": "2026-03-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4 (latest)", - "display_name": "Claude Opus 4 (latest)", + "id": "openai/gpt-3.5-turbo-0613", + "name": "OpenAI: GPT-3.5 Turbo (older v0613)", + "display_name": "OpenAI: GPT-3.5 Turbo (older v0613)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 4095, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "openai/gpt-5-image-mini", + "name": "OpenAI: GPT-5 Image Mini", + "display_name": "OpenAI: GPT-5 Image Mini", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-10-16", + "last_updated": "2026-03-15", "cost": { "input": 2.5, - "output": 10, - "cache_read": 1.25 + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "openai/gpt-5.1-codex", + "name": "OpenAI: GPT-5.1-Codex", + "display_name": "OpenAI: GPT-5.1-Codex", "modalities": { "input": [ "text", @@ -119880,8 +125056,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -119894,20 +125069,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": 
"openai/gpt-5.1-codex-max", + "name": "OpenAI: GPT-5.1-Codex-Max", + "display_name": "OpenAI: GPT-5.1-Codex-Max", "modalities": { "input": [ "text", @@ -119918,22 +125092,29 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -119943,72 +125124,57 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "openai/gpt-4o-2024-08-06", + "name": "OpenAI: GPT-4o (2024-08-06)", + "display_name": "OpenAI: GPT-4o (2024-08-06)", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2024-08-06", + 
"last_updated": "2026-03-15", "cost": { - "input": 20, - "output": 80 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "openai/o3-mini", + "name": "OpenAI: o3 Mini", + "display_name": "OpenAI: o3 Mini", "modalities": { "input": [ - "text", - "image" + "pdf", + "text" ], "output": [ "text" @@ -120040,32 +125206,31 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-12-20", + "last_updated": "2026-03-15", "cost": { "input": 1.1, "output": 4.4, - "cache_read": 0.28 + "cache_read": 0.55 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "openai/gpt-5.2", + "name": "OpenAI: GPT-5.2", + "display_name": "OpenAI: GPT-5.2", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -120098,22 +125263,22 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-12-11", + "last_updated": "2026-03-15", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "openai/gpt-5.3-codex", + "name": "OpenAI: GPT-5.3-Codex", + "display_name": "OpenAI: GPT-5.3-Codex", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -120121,10 +125286,9 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -120137,6 +125301,13 @@ "mode": "effort", "effort": "medium", "effort_options": 
[ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -120144,53 +125315,83 @@ "visibility": "hidden" } }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-25", + "last_updated": "2026-03-15", + "cost": { + "input": 1.75, + "output": 14 + }, + "type": "chat" + }, + { + "id": "openai/gpt-audio-mini", + "name": "OpenAI: GPT Audio Mini", + "display_name": "OpenAI: GPT Audio Mini", + "modalities": { + "input": [ + "audio", + "text" + ], + "output": [ + "audio", + "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2026-01-20", + "last_updated": "2026-03-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openai/gpt-5.1-codex-mini", + "name": "OpenAI: GPT-5.1-Codex-Mini", + "display_name": "OpenAI: GPT-5.1-Codex-Mini", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 400000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -120203,69 +125404,46 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": 
"2026-04-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI: o4 Mini Deep Research", + "display_name": "OpenAI: o4 Mini Deep Research", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -120275,32 +125453,32 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "openai/gpt-4.1-nano", + "name": "OpenAI: GPT-4.1 Nano", + "display_name": "OpenAI: GPT-4.1 Nano", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + 
"context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -120309,35 +125487,32 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "openai/gpt-oss-120b", + "name": "OpenAI: gpt-oss-120b", + "display_name": "OpenAI: gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 26215 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -120345,43 +125520,27 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.039, + "output": 0.19 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "openai/gpt-4o-2024-11-20", + "name": "OpenAI: GPT-4o (2024-11-20)", + "display_name": "OpenAI: GPT-4o (2024-11-20)", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -120389,43 +125548,42 @@ ] }, 
"limit": { - "context": 16385, - "output": 4096 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "release_date": "2024-11-20", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 1.5, + "input": 2.5, + "output": 10, "cache_read": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "openai/o1", + "name": "OpenAI: o1", + "display_name": "OpenAI: o1", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, @@ -120440,13 +125598,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -120456,53 +125607,46 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2024-12-05", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "openai/o1-pro", + "name": "OpenAI: o1-pro", + "display_name": "OpenAI: o1-pro", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - 
"default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -120512,104 +125656,97 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-03-19", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + "id": "openai/gpt-chat-latest", + "name": "OpenAI: GPT Chat Latest", + "display_name": "OpenAI: GPT Chat Latest", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2026-05-05", + "last_updated": "2026-05-07", "cost": { - "input": 10, - "output": 30 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "openai/gpt-5-image", + "name": "OpenAI: GPT-5 Image", + "display_name": "OpenAI: GPT-5 Image", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ + "image", "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, 
- "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2025-10-14", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 10, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "openai/gpt-5.4", + "name": "OpenAI: GPT-5.4", + "display_name": "OpenAI: GPT-5.4", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -120617,53 +125754,65 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1050000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 30, - "output": 60 + "input": 2.5, + "output": 15 }, "type": "chat" - } - ] - }, - "requesty": { - "id": "requesty", - "name": "Requesty", - "display_name": "Requesty", - "api": "https://router.requesty.ai/v1", - "doc": "https://requesty.ai/solution/llm-routing/models", - "models": [ + }, { - "id": 
"anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "openai/gpt-5.4-mini", + "name": "OpenAI: GPT-5.4 Mini", + "display_name": "OpenAI: GPT-5.4 Mini", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -120673,505 +125822,421 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "mode": "effort", + "effort": "none", "effort_options": [ + "none", "low", "medium", - "high" + "high", + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2026-03-17", + "last_updated": "2026-04-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "openai/gpt-4.1", + "name": "OpenAI: GPT-4.1", + "display_name": "OpenAI: GPT-4.1", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "openai/gpt-4o-audio-preview", + "name": "OpenAI: GPT-4o Audio", + "display_name": "OpenAI: GPT-4o Audio", "modalities": { "input": [ - "text", - "image" + "audio", + "text" ], "output": [ + "audio", "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-15", + "last_updated": "2026-03-15", + "cost": { + "input": 2.5, + "output": 10 + }, + "type": "chat" + }, + { + "id": "openai/o3-deep-research", + "name": "OpenAI: o3 Deep Research", + "display_name": "OpenAI: o3 Deep Research", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens 
remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2024-06-26", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 10, + "output": 40, + "cache_read": 2.5 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "openai/gpt-4-turbo-preview", + "name": "OpenAI: GPT-4 Turbo Preview", + "display_name": "OpenAI: GPT-4 Turbo Preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 62000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-01", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2024-01-25", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "openai/gpt-5-mini", + "name": "OpenAI: GPT-5 Mini", + "display_name": "OpenAI: GPT-5 Mini", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-08-07", + "last_updated": "2026-03-15", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4.1-mini", + "name": "OpenAI: GPT-4.1 Mini", + "display_name": "OpenAI: GPT-4.1 Mini", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "openai/gpt-4-turbo", + "name": "OpenAI: GPT-4 Turbo", + "display_name": "OpenAI: GPT-4 Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this 
model family." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2023-09-13", + "last_updated": "2024-04-09", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "anthropic/claude-3-7-sonnet", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": "openai/gpt-5-nano", + "name": "OpenAI: GPT-5 Nano", + "display_name": "OpenAI: GPT-5 Nano", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2024-01", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-08-07", + "last_updated": "2026-03-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "openai/gpt-5.4-pro", + 
"name": "OpenAI: GPT-5.4 Pro", + "display_name": "OpenAI: GPT-5.4 Pro", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 1050000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "default_enabled": true, + "mode": "effort", "effort": "high", "effort_options": [ - "low", "medium", "high", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-03-06", + "last_updated": "2026-03-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "openai/o3-mini-high", + "name": "OpenAI: o3 Mini High", + "display_name": "OpenAI: o3 Mini High", "modalities": { "input": [ - "text", - "image", - "pdf" + "pdf", + "text" ], "output": [ "text" @@ -121179,93 +126244,101 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-01-31", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "xai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "openai/gpt-5.4-image-2", + "name": "OpenAI: GPT-5.4 Image 2", + "display_name": "OpenAI: GPT-5.4 Image 2", "modalities": { "input": [ + "image", "text", - "image" + "pdf" ], "output": [ + "image", "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 272000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 3, + "input": 8, "output": 15, - "cache_read": 0.75, - "cache_write": 3 + "cache_read": 2 }, "type": "chat" }, { - "id": "xai/grok-4-fast", - "name": "Grok 4 Fast", - "display_name": "Grok 4 Fast", + "id": "openai/gpt-4o-search-preview", + "name": "OpenAI: GPT-4o Search Preview", + "display_name": "OpenAI: GPT-4o Search Preview", "modalities": { "input": [ "text" @@ -121275,38 +126348,31 @@ ] }, "limit": { - "context": 2000000, - "output": 64000 + "context": 128000, + "output": 16384 }, - 
"temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2025-03-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05, - "cache_write": 0.2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "openai/gpt-5.5-pro", + "name": "OpenAI: GPT-5.5 Pro", + "display_name": "OpenAI: GPT-5.5 Pro", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -121314,10 +126380,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -121325,129 +126391,68 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 1 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "openai/gpt-4o-mini", + "name": "OpenAI: GPT-4o-mini", + "display_name": "OpenAI: GPT-4o-mini", "modalities": { "input": [ - "text", "image", - "audio", - "video", - "pdf" + "pdf", + 
"text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2024-07-18", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31, - "cache_write": 2.375, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "openai/gpt-oss-20b", + "name": "OpenAI: gpt-oss-20b", + "display_name": "OpenAI: gpt-oss-20b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, @@ -121457,97 +126462,54 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, - 
"open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.55 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "openai/gpt-4-1106-preview", + "name": "OpenAI: GPT-4 Turbo (older v1106)", + "display_name": "OpenAI: GPT-4 Turbo (older v1106)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2023-11-06", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "cache_write": 4.5 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "openai/gpt-5-codex", + "name": "OpenAI: GPT-5 Codex", + "display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ "text", @@ -121559,7 +126521,7 @@ }, "limit": { "context": 400000, - "output": 272000 + "output": 128000 }, "temperature": false, "tool_call": true, @@ -121571,8 +126533,14 @@ "reasoning": { "supported": true, 
"default_enabled": true, - "mode": "fixed", - "effort": "high", + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], "verbosity": "medium", "verbosity_options": [ "low", @@ -121584,19 +126552,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 15, - "output": 120 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "openai/gpt-5.2-codex", + "name": "OpenAI: GPT-5.2-Codex", + "display_name": "OpenAI: GPT-5.2-Codex", "modalities": { "input": [ "text", @@ -121607,8 +126575,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 400000, + "output": 128000 }, "temperature": false, "tool_call": true, @@ -121623,10 +126591,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -121639,58 +126607,24 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "openai/gpt-5.1", + "name": "OpenAI: GPT-5.1", + "display_name": "OpenAI: GPT-5.1", "modalities": { "input": [ - "text", - "image" - ], - "output": [ + "image", + "pdf", "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true, - "default": true - 
}, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" @@ -121716,8 +126650,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -121730,34 +126663,34 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-11-13", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "openai/gpt-5.5", + "name": "OpenAI: GPT-5.5", + "display_name": "OpenAI: GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -121770,10 +126703,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -121786,185 +126719,220 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5-image", - "name": "GPT-5 Image", - "display_name": "GPT-5 Image", + "id": 
"thedrummer/cydonia-24b-v4.1", + "name": "TheDrummer: Cydonia 24B V4.1", + "display_name": "TheDrummer: Cydonia 24B V4.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-27", + "last_updated": "2026-03-15", + "cost": { + "input": 0.3, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "thedrummer/skyfall-36b-v2", + "name": "TheDrummer: Skyfall 36B V2", + "display_name": "TheDrummer: Skyfall 36B V2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-03-11", + "last_updated": "2026-03-15", + "cost": { + "input": 0.55, + "output": 0.8 + }, + "type": "chat" + }, + { + "id": "thedrummer/unslopnemo-12b", + "name": "TheDrummer: UnslopNemo 12B", + "display_name": "TheDrummer: UnslopNemo 12B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-10-14", - "last_updated": "2025-10-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-09", + "last_updated": "2026-03-15", "cost": { - "input": 5, - "output": 10, - "cache_read": 1.25 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "thedrummer/rocinante-12b", + "name": 
"TheDrummer: Rocinante 12B", + "display_name": "TheDrummer: Rocinante 12B", "modalities": { "input": [ - "text", - "audio", - "image", - "video" + "text" ], "output": [ - "text", - "audio", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "release_date": "2024-09-30", + "last_updated": "2026-03-15", + "cost": { + "input": 0.17, + "output": 0.43 + }, + "type": "chat" + }, + { + "id": "bytedance/ui-tars-1.5-7b", + "name": "ByteDance: UI-TARS 7B ", + "display_name": "ByteDance: UI-TARS 7B ", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 2048 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "rekaai/reka-flash-3", + "name": "Reka Flash 3", + "display_name": "Reka Flash 3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 65536, + "output": 65536 }, - 
"temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-12", + "last_updated": "2026-04-11", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "rekaai/reka-edge", + "name": "Reka Edge", + "display_name": "Reka Edge", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -121972,256 +126940,150 @@ "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2026-03-20", + "last_updated": "2026-04-11", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "mistralai/mistral-large-2407", + "name": "Mistral Large 2407", + "display_name": "Mistral Large 2407", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 32768 }, - 
"temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 21, - "output": 168 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4 Mini", - "display_name": "o4 Mini", + "id": "mistralai/mistral-small-3.2-24b-instruct", + "name": "Mistral: Mistral Small 3.2 24B", + "display_name": "Mistral: Mistral Small 3.2 24B", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.28 + "input": 0.06, + "output": 0.18, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": 
"mistralai/mistral-nemo", + "name": "Mistral: Mistral Nemo", + "display_name": "Mistral: Mistral Nemo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-01", + "last_updated": "2024-07-30", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "mistralai/mistral-medium-3-5", + "name": "Mistral: Mistral Medium 3.5", + "display_name": "Mistral: Mistral Medium 3.5", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - 
"none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-04-30", + "last_updated": "2026-05-07", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "display_name": "Mistral: Ministral 3 8B 2512", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -122229,481 +127091,315 @@ ] }, "limit": { - "context": 16000, - "output": 4000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "mistralai/devstral-small", + "name": "Mistral: Devstral Small 1.1", + "display_name": "Mistral: Devstral Small 1.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ 
"text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-07", + "last_updated": "2025-07-10", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.08 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT-5.1-Codex-Max", - "display_name": "GPT-5.1-Codex-Max", + "id": "mistralai/mistral-small-3.1-24b-instruct", + "name": "Mistral: Mistral Small 3.1 24B", + "display_name": "Mistral: Mistral Small 3.1 24B", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-03-17", + "last_updated": "2026-03-15", "cost": { - "input": 1.1, - "output": 9, - "cache_read": 0.11 + "input": 0.35, + "output": 0.56, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1-Codex-Mini", - "display_name": "GPT-5.1-Codex-Mini", + "id": "mistralai/mistral-saba", + "name": "Mistral: Saba", + 
"display_name": "Mistral: Saba", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 100000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "mistralai/mistral-large", + "name": "Mistral Large", + "display_name": "Mistral Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 25600 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-07-24", + "last_updated": "2025-12-02", "cost": { "input": 2, - "output": 8, - "cache_read": 0.5 + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-5.3-codex", - "name": "GPT-5.3-Codex", - "display_name": "GPT-5.3-Codex", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral: Mistral Medium 3.1", + "display_name": "Mistral: Mistral 
Medium 3.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 26215 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2025-08-12", + "last_updated": "2025-08-12", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "mistralai/pixtral-large-2411", + "name": "Mistral: Pixtral Large 2411", + "display_name": "Mistral: Pixtral Large 2411", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "release_date": "2024-11-19", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": 
"mistralai/devstral-medium", + "name": "Mistral: Devstral Medium", + "display_name": "Mistral: Devstral Medium", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-10", + "last_updated": "2025-07-10", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "mistralai/mistral-small-24b-instruct-2501", + "name": "Mistral: Mistral Small 3", + "display_name": "Mistral: Mistral Small 3", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - 
"knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-01-10", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.05, + "output": 0.08 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "display_name": "Mistral: Ministral 3 3B 2512", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.1 }, "type": "chat" - } - ] - }, - "venice": { - "id": "venice", - "name": "Venice AI", - "display_name": "Venice AI", - "doc": "https://docs.venice.ai", - "models": [ + }, { - "id": "nvidia-nemotron-cascade-2-30b-a3b", - "name": "Nemotron Cascade 2 30B A3B", - "display_name": "Nemotron Cascade 2 30B A3B", + "id": "mistralai/mistral-small-2603", + "name": "Mistral: Mistral Small 4", + "display_name": "Mistral: Mistral Small 4", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -122711,8 +127407,8 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -122720,20 +127416,21 @@ "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-24", - 
"last_updated": "2026-04-09", + "release_date": "2026-03-16", + "last_updated": "2026-04-11", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "zai-org-glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "mistralai/mistral-large-2411", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ "text" @@ -122743,29 +127440,28 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-03-12", + "release_date": "2024-07-24", + "last_updated": "2024-11-04", "cost": { - "input": 0.125, - "output": 0.5 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai-gpt-52", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "mistralai/mistral-7b-instruct-v0.1", + "name": "Mistral: Mistral 7B Instruct v0.1", + "display_name": "Mistral: Mistral 7B Instruct v0.1", "modalities": { "input": [ "text" @@ -122775,31 +127471,28 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 2824, + "output": 565 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-13", - "last_updated": "2026-03-12", + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.11, + "output": 0.19 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + 
"display_name": "Mistral: Ministral 3 14B 2512", "modalities": { "input": [ "text", @@ -122810,183 +127503,91 @@ ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-12-06", - "last_updated": "2026-04-12", + "release_date": "2025-12-16", + "last_updated": "2025-12-16", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "mistralai/devstral-2512", + "name": "Mistral: Devstral 2 2512", + "display_name": "Mistral: Devstral 2 2512", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": 
true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-12", + "last_updated": "2026-03-15", "cost": { - "input": 3.6, - "output": 18, - "cache_read": 0.36, - "cache_write": 4.5 + "input": 0.4, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "claude-opus-4-8-fast", - "name": "Claude Opus 4.8 Fast", - "display_name": "Claude Opus 4.8 Fast", + "id": "mistralai/mixtral-8x22b-instruct", + "name": "Mistral: Mixtral 8x22B Instruct", + "display_name": "Mistral: Mixtral 8x22B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 65536, + "output": 13108 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "attachment": false, + "open_weights": true, + "release_date": "2024-04-17", + "last_updated": "2024-04-17", "cost": { - "input": 12, - "output": 60, - "cache_read": 1.2, - "cache_write": 15 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai-gpt-54", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "mistralai/mistral-medium-3", + "name": "Mistral: Mistral Medium 3", + "display_name": "Mistral: Mistral Medium 3", "modalities": { "input": [ "text", @@ -122997,41 +127598,40 @@ ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 3.13, - "output": 18.8, - "cache_read": 0.313 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "qwen3-next-80b", - "name": "Qwen 3 Next 80b", - "display_name": "Qwen 3 Next 80b", + "id": "mistralai/voxtral-small-24b-2507", + "name": "Mistral: Voxtral Small 24B 2507", + "display_name": "Mistral: Voxtral Small 24B 2507", "modalities": { "input": [ - "text" + "text", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 32000, + "output": 6400 }, "temperature": true, "tool_call": true, @@ -123040,19 +127640,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.35, - "output": 1.9 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "openai-gpt-4o-mini-2024-07-18", - "name": "GPT-4o Mini", - 
"display_name": "GPT-4o Mini", + "id": "mistralai/mistral-large-2512", + "name": "Mistral: Mistral Large 3 2512", + "display_name": "Mistral: Mistral Large 3 2512", "modalities": { "input": [ "text", @@ -123063,8 +127662,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, @@ -123072,24 +127671,22 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "open_weights": true, + "release_date": "2024-11-01", + "last_updated": "2025-12-16", "cost": { - "input": 0.1875, - "output": 0.75, - "cache_read": 0.09375 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "mistral-small-2603", - "name": "Mistral Small 4", - "display_name": "Mistral Small 4", + "id": "mistralai/codestral-2508", + "name": "Mistral: Codestral 2508", + "display_name": "Mistral: Codestral 2508", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -123097,60 +127694,58 @@ }, "limit": { "context": 256000, - "output": 65536 + "output": 51200 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-03-16", - "last_updated": "2026-04-09", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.1875, - "output": 0.75 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "gemma-4-uncensored", - "name": "Gemma 4 Uncensored", - "display_name": "Gemma 4 Uncensored", + "id": "morph/morph-v3-fast", + "name": "Morph: Morph V3 Fast", + "display_name": "Morph: Morph V3 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 81920, + "output": 38000 }, "temperature": true, - "tool_call": true, + "tool_call": false, 
"reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-13", - "last_updated": "2026-04-19", + "attachment": false, + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.8, + "output": 1.2 }, "type": "chat" }, { - "id": "openai-gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "morph/morph-v3-large", + "name": "Morph: Morph V3 Large", + "display_name": "Morph: Morph V3 Large", "modalities": { "input": [ "text" @@ -123160,159 +127755,134 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-06", - "last_updated": "2026-05-06", + "open_weights": false, + "release_date": "2024-08-15", + "last_updated": "2024-08-15", "cost": { - "input": 0.07, - "output": 0.3 + "input": 0.9, + "output": 1.9 }, "type": "chat" }, { - "id": "hermes-3-llama-3.1-405b", - "name": "Hermes 3 Llama 3.1 405b", - "display_name": "Hermes 3 Llama 3.1 405b", + "id": "bytedance-seed/seed-1.6-flash", + "name": "ByteDance Seed: Seed 1.6 Flash", + "display_name": "ByteDance Seed: Seed 1.6 Flash", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-25", - "last_updated": "2026-03-12", + "release_date": "2025-12-23", + "last_updated": 
"2026-03-15", "cost": { - "input": 1.1, - "output": 3 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "claude-opus-4-7-fast", - "name": "Claude Opus 4.7 Fast", - "display_name": "Claude Opus 4.7 Fast", + "id": "bytedance-seed/seed-1.6", + "name": "ByteDance Seed: Seed 1.6", + "display_name": "ByteDance Seed: Seed 1.6", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-05-14", - "last_updated": "2026-05-14", + "release_date": "2025-09", + "last_updated": "2025-09", "cost": { - "input": 36, - "output": 180, - "cache_read": 3.6, - "cache_write": 45 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "openai-gpt-4o-2024-11-20", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "bytedance-seed/seed-2.0-mini", + "name": "ByteDance Seed: Seed-2.0-Mini", + "display_name": "ByteDance Seed: Seed-2.0-Mini", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-28", - "last_updated": "2026-03-06", + "open_weights": true, + "release_date": "2026-02-27", + "last_updated": "2026-03-15", "cost": { - "input": 3.125, - "output": 12.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "google-gemma-4-26b-a4b-it", - "name": "Google Gemma 4 26B A4B Instruct", - "display_name": "Google Gemma 4 26B A4B Instruct", + "id": "bytedance-seed/seed-2.0-lite", + "name": "ByteDance Seed: Seed-2.0-Lite", + "display_name": "ByteDance Seed: Seed-2.0-Lite", "modalities": { "input": [ - "text", "image", + "text", "video" ], "output": [ @@ -123320,8 +127890,8 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -123331,128 +127901,95 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-12", + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.1625, - "output": 0.5 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "claude-opus-4-6-fast", - 
"name": "Claude Opus 4.6 Fast", - "display_name": "Claude Opus 4.6 Fast", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 16384, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "attachment": false, + "open_weights": true, + "release_date": "2024-10-22", + "last_updated": "2026-03-15", "cost": { - "input": 36, - "output": 180, - "cache_read": 3.6, - "cache_write": 45 + "input": 3, + "output": 5 }, "type": "chat" }, { - "id": "google-gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free", + "name": "NVIDIA: Nemotron 3 Nano Omni (free)", + "display_name": "NVIDIA: Nemotron 3 Nano Omni (free)", "modalities": { "input": [ "text", - "image" + "audio", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-11-04", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2026-04-28", + "last_updated": "2026-05-01", "cost": { - "input": 0.12, - "output": 0.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "minimax-m3", - "name": "MiniMax M3", - "display_name": "MiniMax M3", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "NVIDIA: Nemotron 3 Nano 30B A3B", + "display_name": "NVIDIA: Nemotron 3 Nano 30B A3B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 500000, - "output": 131072 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, @@ -123460,58 +127997,52 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "release_date": 
"2026-06-01", - "last_updated": "2026-06-04", + "attachment": false, + "open_weights": true, + "release_date": "2024-12", + "last_updated": "2026-02-04", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "venice-uncensored-role-play", - "name": "Venice Role Play Uncensored", - "display_name": "Venice Role Play Uncensored", + "id": "nvidia/llama-3.3-nemotron-super-49b-v1.5", + "name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", + "display_name": "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-20", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": false, + "release_date": "2025-03-16", + "last_updated": "2025-03-16", "cost": { - "input": 0.5, - "output": 2 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "nvidia/nemotron-nano-9b-v2", + "name": "NVIDIA: Nemotron Nano 9B V2", + "display_name": "NVIDIA: Nemotron Nano 9B V2", "modalities": { "input": [ "text" @@ -123521,8 +128052,8 @@ ] }, "limit": { - "context": 160000, - "output": 32768 + "context": 131072, + "output": 26215 }, "temperature": true, "tool_call": true, @@ -123530,42 +128061,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2025-12-04", - "last_updated": "2026-03-24", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 0.33, - "output": 0.48, - "cache_read": 0.16 + 
"input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "nvidia/nemotron-3-super-120b-a12b:free", + "name": "NVIDIA: Nemotron 3 Super (free)", + "display_name": "NVIDIA: Nemotron 3 Super (free)", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -123573,42 +128093,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-19", - "last_updated": "2026-03-12", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-12", + "last_updated": "2026-03-15", "cost": { - "input": 0.7, - "output": 3.75, - "cache_read": 0.07 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org-glm-5-1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "nvidia/nemotron-3-super-120b-a12b", + "name": "NVIDIA: Nemotron 3 Super", + "display_name": "NVIDIA: Nemotron 3 Super", "modalities": { "input": [ "text" @@ -123618,8 +128116,8 @@ ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -123627,44 +128125,35 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, 
"open_weights": true, - "release_date": "2026-04-07", - "last_updated": "2026-04-08", + "release_date": "2026-03-11", + "last_updated": "2026-04-11", "cost": { - "input": 1.75, - "output": 5.5, - "cache_read": 0.325 + "input": 0.1, + "output": 0.5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "grok-build-0-1", - "name": "Grok Build 0.1", - "display_name": "Grok Build 0.1", + "id": "xiaomi/mimo-v2.5", + "name": "Xiaomi: MiMo-V2.5", + "display_name": "Xiaomi: MiMo-V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -123672,49 +128161,63 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-22", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1, + "input": 0.4, "output": 2, - "cache_read": 0.2, + "cache_read": 0.08, "tiers": [ { - "input": 2, + "input": 0.8, "output": 4, - "cache_read": 0.4, + "cache_read": 0.16, "tier": { "type": "context", - "size": 200000 + "size": 256000 } } ], "context_over_200k": { - "input": 2, + "input": 0.8, "output": 4, - "cache_read": 0.4 + "cache_read": 0.16 } }, "type": "chat" }, { - "id": "qwen3-6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "xiaomi/mimo-v2-omni", + "name": "Xiaomi: MiMo-V2-Omni", + "display_name": "Xiaomi: MiMo-V2-Omni", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, + "context": 262144, "output": 65536 }, "temperature": true, @@ -123725,18 
+128228,20 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.325, - "output": 3.25 + "input": 0.4, + "output": 2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "zai-org-glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "xiaomi/mimo-v2-flash", + "name": "Xiaomi: MiMo-V2-Flash", + "display_name": "Xiaomi: MiMo-V2-Flash", "modalities": { "input": [ "text" @@ -123746,8 +128251,8 @@ ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -123755,46 +128260,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2024-04-01", - "last_updated": "2026-04-04", + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.85, - "output": 2.75, - "cache_read": 0.3 + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 }, "type": "chat" }, { - "id": "gemini-3-1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "xiaomi/mimo-v2-pro", + "name": "Xiaomi: MiMo-V2-Pro", + "display_name": "Xiaomi: MiMo-V2-Pro", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -123802,55 +128294,55 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-02-19", - "last_updated": "2026-03-12", + "knowledge": "2024-12", 
+ "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.5, - "cache_write": 0.5, + "input": 1, + "output": 3, + "cache_read": 0.2, "tiers": [ { - "input": 5, - "output": 22.5, - "cache_read": 0.5, + "input": 2, + "output": 6, + "cache_read": 0.4, "tier": { "type": "context", - "size": 200000 + "size": 256000 } } ], "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 + "input": 2, + "output": 6, + "cache_read": 0.4 } }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b", - "name": "Qwen3 VL 235B", - "display_name": "Qwen3 VL 235B", + "id": "xiaomi/mimo-v2.5-pro", + "name": "Xiaomi: MiMo V2.5 Pro", + "display_name": "Xiaomi: MiMo V2.5 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -123863,32 +128355,49 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-16", - "last_updated": "2026-03-12", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.25, - "output": 1.5 + "input": 1, + "output": 3, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "openai-gpt-55-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "inception/mercury-2", + "name": "Inception: Mercury 2", + "display_name": "Inception: Mercury 2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, 
+ "output": 50000 }, "temperature": true, "tool_call": true, @@ -123896,20 +128405,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-24", - "last_updated": "2026-04-25", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 37.5, - "output": 225 + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "kimi-k2-5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "anthropic/claude-3.5-haiku", + "name": "Anthropic: Claude 3.5 Haiku", + "display_name": "Anthropic: Claude 3.5 Haiku", "modalities": { "input": [ "text", @@ -123920,44 +128430,91 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.8, + "output": 4, + "cache_read": 0.08, + "cache_write": 1 + }, + "type": "chat" + }, + { + "id": "anthropic/claude-sonnet-4.5", + "name": "Anthropic: Claude Sonnet 4.5", + "display_name": "Anthropic: Claude Sonnet 4.5", + "modalities": { + "input": [ + "image", + "pdf", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2026-01-27", - "last_updated": "2026-04-30", + "release_date": "2025-09-29", + "last_updated": "2026-03-15", "cost": { - "input": 0.56, - "output": 3.5, - "cache_read": 0.22 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen 3 235B A22B Thinking 2507", - "display_name": "Qwen 3 235B A22B Thinking 2507", + "id": "anthropic/claude-sonnet-4", + "name": "Anthropic: Claude Sonnet 4", + "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -123965,146 +128522,239 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.45, - "output": 3.5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "venice-uncensored-1-2", - "name": "Venice Uncensored 1.2", - "display_name": "Venice Uncensored 1.2", + "id": "anthropic/claude-opus-4.6-fast", + "name": "Anthropic: Claude Opus 4.6 (Fast)", + "display_name": "Anthropic: Claude Opus 4.6 (Fast)", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-19", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-04-07", + "last_updated": "2026-04-11", "cost": { - "input": 0.2, - "output": 0.9 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-ultra-550b-a55b", - "name": "NVIDIA Nemotron 3 Ultra", - "display_name": "NVIDIA Nemotron 3 Ultra", + "id": "anthropic/claude-haiku-4.5", + "name": "Anthropic: Claude Haiku 4.5", + "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-06-04", - "last_updated": "2026-06-08", + "open_weights": false, + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.625, - "output": 3.125, - "cache_read": 0.1875 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3-5-397b-a17b", - "name": "Qwen 3.5 397B", - "display_name": "Qwen 3.5 397B", + "id": "anthropic/claude-opus-4.7-fast", + "name": "Anthropic: Claude Opus 4.7 (Fast)", + "display_name": "Anthropic: Claude Opus 4.7 (Fast)", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-16", - "last_updated": "2026-04-16", + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-16", "cost": { - "input": 0.75, - "output": 4.5 + "input": 30, + "output": 150, + "cache_read": 3, + "cache_write": 37.5 }, "type": "chat" }, { - "id": "qwen-3-6-plus", - "name": "Qwen 3.6 Plus Uncensored", - "display_name": "Qwen 3.6 Plus Uncensored", + "id": "anthropic/claude-opus-4.7", + "name": "Anthropic: Claude Opus 4.7", + "display_name": "Anthropic: Claude Opus 4.7", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" @@ -124112,50 +128762,60 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-06", - "last_updated": "2026-04-12", + "release_date": "2026-04-16", + "last_updated": "2026-05-01", "cost": { - "input": 0.625, - "output": 3.75, - "cache_read": 0.0625, - "cache_write": 0.78, - "tiers": [ - { - "input": 2.5, - "output": 7.5, - "cache_read": 0.0625, - "cache_write": 0.78, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.0625, - "cache_write": 0.78 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "zai-org-glm-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "anthropic/claude-opus-4.1", + "name": "Anthropic: Claude Opus 4.1", + "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ + "image", + "pdf", "text" ], "output": [ @@ -124163,80 +128823,119 @@ ] }, "limit": { - "context": 198000, + "context": 200000, "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen3-5-35b-a3b", - "name": "Qwen 3.5 35B A3B", - "display_name": "Qwen 3.5 35B A3B", + "id": "anthropic/claude-opus-4.5", + "name": "Anthropic: Claude Opus 4.5", + "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ - "text", "image", - "video" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-25", - "last_updated": "2026-05-25", + "open_weights": false, + "release_date": "2025-11-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.3125, - "output": 1.25, - "cache_read": 0.15625 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai-gpt-54-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "anthropic/claude-sonnet-4.6", + "name": "Anthropic: Claude Sonnet 4.6", + "display_name": "Anthropic: Claude Sonnet 4.6", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" @@ -124250,125 +128949,142 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-05", - "last_updated": "2026-03-09", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-15", "cost": { - "input": 37.5, - "output": 225, - "tiers": [ - { - "input": 75, - "output": 337.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 75, - "output": 337.5 - } + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "minimax-m25", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "anthropic/claude-3-haiku", + "name": "Anthropic: Claude 3 Haiku", + "display_name": "Anthropic: Claude 3 Haiku", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 32768 + "context": 200000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-04-12", + "release_date": "2024-03-07", + "last_updated": "2024-03-07", "cost": { - "input": 0.34, - "output": 1.19, - "cache_read": 0.04 + "input": 0.25, + "output": 1.25, + "cache_read": 0.03, + "cache_write": 0.3 }, "type": "chat" }, { - "id": "kimi-k2-6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "anthropic/claude-opus-4", + "name": "Anthropic: Claude Opus 4", + "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ - "text", - "image" + "image", + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-30", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.85, - "output": 4.655, - "cache_read": 0.22 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai-gpt-53-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "anthropic/claude-opus-4.6", + "name": "Anthropic: Claude Opus 4.6", + "display_name": "Anthropic: Claude Opus 4.6", "modalities": { "input": [ "text", @@ -124379,30 +129095,60 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-12", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistral-small-3-2-24b-instruct", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", + "id": "tencent/hunyuan-a13b-instruct", + "name": "Tencent: Hunyuan A13B Instruct", + "display_name": "Tencent: Hunyuan A13B Instruct", "modalities": { "input": [ "text" @@ -124412,28 +129158,29 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-15", - "last_updated": "2026-03-16", + "open_weights": false, + "release_date": "2025-06-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.09375, - "output": 0.25 + "input": 0.14, + "output": 0.57 }, "type": "chat" }, { - "id": "qwen-3-7-max", - "name": "Qwen 3.7 Max", - "display_name": "Qwen 3.7 Max", + "id": "tencent/hy3-preview", + "name": "Tencent: Hy3 Preview", + "display_name": "Tencent: Hy3 Preview", "modalities": { "input": [ "text" @@ -124443,8 +129190,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -124452,90 +129199,89 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "release_date": "2026-05-22", - "last_updated": "2026-05-25", + "release_date": "2026-04-22", + "last_updated": "2026-05-16", "cost": { - "input": 2.7, - "output": 8.05, - 
"cache_read": 0.27, - "cache_write": 3.35 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "z-ai-glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "deepcogito/cogito-v2.1-671b", + "name": "Deep Cogito: Cogito v2.1 671B", + "display_name": "Deep Cogito: Cogito v2.1 671B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 128000, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-12", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-14", + "last_updated": "2026-03-15", "cost": { - "input": 1.5, - "output": 5, - "cache_read": 0.3 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "openai-gpt-54-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "cohere/command-a", + "name": "Cohere: Command A", + "display_name": "Cohere: Command A", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-31", + "attachment": false, + "open_weights": true, + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 0.9375, - "output": 5.625, - "cache_read": 0.09375 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "nvidia-nemotron-3-nano-30b-a3b", - "name": "NVIDIA Nemotron 3 Nano 30B", - "display_name": "NVIDIA Nemotron 3 Nano 30B", + "id": "cohere/command-r-08-2024", + "name": "Cohere: 
Command R (08-2024)", + "display_name": "Cohere: Command R (08-2024)", "modalities": { "input": [ "text" @@ -124546,7 +129292,7 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4000 }, "temperature": true, "tool_call": true, @@ -124555,18 +129301,18 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "llama-3.3-70b", - "name": "Llama 3.3 70B", - "display_name": "Llama 3.3 70B", + "id": "cohere/command-r7b-12-2024", + "name": "Cohere: Command R7B (12-2024)", + "display_name": "Cohere: Command R7B (12-2024)", "modalities": { "input": [ "text" @@ -124577,7 +129323,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 4000 }, "temperature": true, "tool_call": true, @@ -124586,19 +129332,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-04-06", - "last_updated": "2026-03-12", + "release_date": "2024-02-27", + "last_updated": "2024-02-27", "cost": { - "input": 0.7, - "output": 2.8 + "input": 0.0375, + "output": 0.15 }, "type": "chat" }, { - "id": "llama-3.2-3b", - "name": "Llama 3.2 3B", - "display_name": "Llama 3.2 3B", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+ (08-2024)", + "display_name": "Cohere: Command R+ (08-2024)", "modalities": { "input": [ "text" @@ -124609,7 +129354,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 4000 }, "temperature": true, "tool_call": true, @@ -124618,19 +129363,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-10-03", - "last_updated": "2026-03-12", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": 
"qwen3-coder-480b-a35b-instruct-turbo", - "name": "Qwen 3 Coder 480B Turbo", - "display_name": "Qwen 3 Coder 480B Turbo", + "id": "gryphe/mythomax-l2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ "text" @@ -124640,29 +129384,28 @@ ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-02-26", + "release_date": "2024-04-25", + "last_updated": "2024-04-25", "cost": { - "input": 0.35, - "output": 1.5, - "cache_read": 0.04 + "input": 0.06, + "output": 0.06 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "stepfun/step-3.5-flash", + "name": "StepFun: Step 3.5 Flash", + "display_name": "StepFun: Step 3.5 Flash", "modalities": { "input": [ "text" @@ -124672,8 +129415,8 @@ ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, @@ -124681,117 +129424,84 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.17, - "output": 0.35, - "cache_read": 0.028 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "grok-4-20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "prime-intellect/intellect-3", + "name": "Prime Intellect: INTELLECT-3", + "display_name": "Prime Intellect: INTELLECT-3", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-11-26", + "last_updated": "2026-02-04", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "tiers": [ - { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "openai-gpt-52-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "Nex AGI: DeepSeek V3.1 Nex N1", + "display_name": "Nex AGI: DeepSeek V3.1 Nex N1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 131072, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-01-15", - "last_updated": "2026-03-12", + "release_date": "2025-01-01", + "last_updated": "2025-11-25", "cost": { - "input": 2.19, - "output": 17.5, - "cache_read": 0.219 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "minimax-m27", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ "text" @@ -124801,91 +129511,59 @@ ] }, "limit": { - "context": 
198000, - "output": 32768 + "context": 6144, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-04-12", + "open_weights": true, + "release_date": "2023-07-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.375, - "output": 1.5, - "cache_read": 0.075 + "input": 0.45, + "output": 0.65 }, "type": "chat" }, { - "id": "claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "relace/relace-search", + "name": "Relace: Relace Search", + "display_name": "Relace: Relace Search", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 256000, "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2025-12-09", + "last_updated": "2026-03-15", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "arcee-trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "relace/relace-apply-3", + "name": "Relace: Relace Apply 3", + "display_name": "Relace: Relace Apply 3", "modalities": { "input": [ "text" @@ -124896,40 +129574,26 @@ }, "limit": { "context": 256000, - "output": 65536 + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-04", + "open_weights": false, + "release_date": "2025-09-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.3125, - "output": 1.125, - "cache_read": 0.075 + "input": 0.85, + "output": 1.25 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen 3 235B A22B Instruct 2507", - "display_name": "Qwen 3 235B A22B Instruct 2507", + "id": "ai21/jamba-large-1.7", + "name": "AI21: Jamba Large 1.7", + "display_name": "AI21: Jamba Large 1.7", "modalities": { "input": [ "text" @@ -124939,8 +129603,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -124948,314 +129612,208 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-04-29", - 
"last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-08-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.75 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "grok-4-3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "arcee-ai/coder-large", + "name": "Arcee AI: Coder Large", + "display_name": "Arcee AI: Coder Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-04-18", - "last_updated": "2026-05-04", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "tiers": [ - { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.5, + "output": 0.8 }, "type": "chat" }, { - "id": "qwen3-5-9b", - "name": "Qwen 3.5 9B", - "display_name": "Qwen 3.5 9B", + "id": "arcee-ai/virtuoso-large", + "name": "Arcee AI: Virtuoso Large", + "display_name": "Arcee AI: Virtuoso Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 131072, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-03-05", - "last_updated": "2026-04-19", + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - 
"output": 0.15 + "input": 0.75, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen-3-7-plus", - "name": "Qwen 3.7 Plus", - "display_name": "Qwen 3.7 Plus", + "id": "arcee-ai/spotlight", + "name": "Arcee AI: Spotlight", + "display_name": "Arcee AI: Spotlight", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 65537 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-06-02", - "last_updated": "2026-06-04", + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.05, - "cache_write": 0.625, - "tiers": [ - { - "input": 1.5, - "output": 6, - "cache_read": 0.15, - "cache_write": 1.875, - "tier": { - "type": "context", - "size": 256000 - } - } - ], - "context_over_200k": { - "input": 1.5, - "output": 6, - "cache_read": 0.15, - "cache_write": 1.875 - } + "input": 0.18, + "output": 0.18 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "arcee-ai/trinity-large-thinking", + "name": "Arcee AI: Trinity Large Thinking", + "display_name": "Arcee AI: Trinity Large Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 198000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": 
[ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-01-15", - "last_updated": "2026-04-12", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-01", + "last_updated": "2026-04-11", "cost": { - "input": 3.75, - "output": 18.75, - "cache_read": 0.375, - "cache_write": 4.69 + "input": 0.22, + "output": 0.85 }, "type": "chat" }, { - "id": "gemini-3-5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "arcee-ai/maestro-reasoning", + "name": "Arcee AI: Maestro Reasoning", + "display_name": "Arcee AI: Maestro Reasoning", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-22", - "last_updated": "2026-05-25", + "attachment": false, + "open_weights": true, + "release_date": "2025-05-06", + "last_updated": "2026-03-15", "cost": { - "input": 1.55, - "output": 9.45, - "cache_read": 0.155, - "cache_write": 0.086 + "input": 0.9, + "output": 3.3 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "arcee-ai/trinity-mini", + "name": "Arcee AI: Trinity Mini", + "display_name": "Arcee AI: Trinity Mini", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - 
}, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-12", + "last_updated": "2026-01-28", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 0.045, + "output": 0.15 }, "type": "chat" }, { - "id": "olafangensan-glm-4.7-flash-heretic", - "name": "GLM 4.7 Flash Heretic", - "display_name": "GLM 4.7 Flash Heretic", + "id": "mancer/weaver", + "name": "Mancer: Weaver (alpha)", + "display_name": "Mancer: Weaver (alpha)", "modalities": { "input": [ "text" @@ -125265,106 +129823,93 @@ ] }, "limit": { - "context": 200000, - "output": 24000 + "context": 8000, + "output": 2000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-04", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2023-08-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0.8 + "input": 0.75, + "output": 1 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "perplexity/sonar-reasoning-pro", + "name": 
"Perplexity: Sonar Reasoning Pro", + "display_name": "Perplexity: Sonar Reasoning Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 128000, + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-29", + "attachment": true, + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 1.73, - "output": 3.796, - "cache_read": 0.33 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "aion-labs-aion-2-0", - "name": "Aion 2.0", - "display_name": "Aion 2.0", + "id": "perplexity/sonar", + "name": "Perplexity: Sonar", + "display_name": "Perplexity: Sonar", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 127072, + "output": 25415 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-24", - "last_updated": "2026-04-12", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { "input": 1, - "output": 2, - "cache_read": 0.25 + "output": 1 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "perplexity/sonar-pro", + "name": "Perplexity: Sonar Pro", + "display_name": "Perplexity: Sonar Pro", "modalities": { "input": [ "text", @@ -125375,92 +129920,61 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + 
"context": 200000, + "output": 8000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 6, - "output": 30, - "cache_read": 0.6, - "cache_write": 7.5 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "google-gemma-4-31b-it", - "name": "Google Gemma 4 31B Instruct", - "display_name": "Google Gemma 4 31B Instruct", + "id": "perplexity/sonar-pro-search", + "name": "Perplexity: Sonar Pro Search", + "display_name": "Perplexity: Sonar Pro Search", "modalities": { "input": [ - "text", "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 200000, + "output": 8000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-03", - "last_updated": "2026-06-08", + "open_weights": false, + "release_date": "2025-10-31", + "last_updated": "2026-03-15", "cost": { - "input": 0.12, - "output": 0.36, - "cache_read": 0.09 + 
"input": 3, + "output": 15 }, "type": "chat" }, { - "id": "z-ai-glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "perplexity/sonar-deep-research", + "name": "Perplexity: Sonar Deep Research", + "display_name": "Perplexity: Sonar Deep Research", "modalities": { "input": [ "text" @@ -125470,80 +129984,61 @@ ] }, "limit": { - "context": 200000, - "output": 32768 + "context": 128000, + "output": 25600 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-15", - "last_updated": "2026-04-12", + "open_weights": false, + "release_date": "2025-01-27", + "last_updated": "2025-01-27", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "grok-4-20", - "name": "Grok 4.20", - "display_name": "Grok 4.20", + "id": "switchpoint/router", + "name": "Switchpoint Router", + "display_name": "Switchpoint Router", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-12", - "last_updated": "2026-05-07", + "release_date": "2025-07-12", + "last_updated": "2026-03-15", "cost": { - "input": 1.42, - "output": 2.83, - "cache_read": 0.23, - "tiers": [ - { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.83, - "output": 5.67, - "cache_read": 0.45 - } + "input": 0.85, + "output": 3.4 }, "type": "chat" }, { - "id": "mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": "openrouter/bodybuilder", + "name": "Body 
Builder (beta)", + "display_name": "Body Builder (beta)", "modalities": { "input": [ "text" @@ -125554,31 +130049,29 @@ }, "limit": { "context": 128000, - "output": 50000 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-20", - "last_updated": "2026-04-09", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 0.3125, - "output": 0.9375, - "cache_read": 0.03125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "zai-org-glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "openrouter/free", + "name": "Free Models Router", + "display_name": "Free Models Router", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -125586,8 +130079,8 @@ ] }, "limit": { - "context": 198000, - "output": 16384 + "context": 200000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -125595,45 +130088,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-24", - "last_updated": "2026-03-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.55, - "output": 2.65, - "cache_read": 0.11 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai-gpt-55", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openrouter/owl-alpha", + "name": "Owl Alpha", + "display_name": "Owl Alpha", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 1048756, + "output": 262144 }, 
"temperature": true, "tool_call": true, @@ -125641,45 +130120,20 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-25", + "release_date": "2026-04-28", + "last_updated": "2026-04-30", "cost": { - "input": 6.25, - "output": 37.5, - "cache_read": 0.625, - "tiers": [ - { - "input": 12.5, - "output": 56.25, - "cache_read": 1.25, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 12.5, - "output": 56.25, - "cache_read": 1.25 - } + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "azure": { - "id": "azure", - "name": "Azure", - "display_name": "Azure", - "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", - "models": [ + }, { - "id": "mistral-large-2411", - "name": "Mistral Large 24.11", - "display_name": "Mistral Large 24.11", + "id": "openrouter/pareto-code", + "name": "Pareto Code Router", + "display_name": "Pareto Code Router", "modalities": { "input": [ "text" @@ -125689,170 +130143,168 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-11-01", - "last_updated": "2024-11-01", + "release_date": "2026-04-21", + "last_updated": "2026-05-01", "cost": { - "input": 2, - "output": 6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "GPT-3.5 Turbo 1106", - "display_name": "GPT-3.5 Turbo 1106", + "id": "openrouter/auto", + "name": "Auto Router", + "display_name": "Auto Router", "modalities": { "input": [ - "text" + "audio", + "image", + "pdf", + "text", + "video" ], "output": [ + "image", "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 
2000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen/qwen3.5-plus-20260420", + "name": "Qwen: Qwen3.5 Plus 2026-04-20", + "display_name": "Qwen: Qwen3.5 Plus 2026-04-20", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.4, + "output": 2.4 }, "type": "chat" }, { - "id": "model-router", - "name": "Model Router", - "display_name": "Model Router", + "id": "qwen/qwen3-vl-235b-a22b-thinking", + "name": "Qwen: Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen: Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-05-19", - "last_updated": "2025-11-18", + "open_weights": true, + "release_date": "2025-09-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.14, - "output": 0 + "input": 0.26, + "output": 2.6 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "qwen/qwen3-vl-30b-a3b-thinking", + "name": "Qwen: Qwen3 VL 30B A3B Thinking", + "display_name": "Qwen: Qwen3 VL 30B A3B Thinking", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -125861,33 +130313,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - 
"effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "open_weights": true, + "release_date": "2025-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 120 + "input": 0.13, + "output": 1.56 }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen: Qwen3 Coder Plus", + "display_name": "Qwen: Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -125897,46 +130344,32 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-07-01", + "last_updated": "2026-03-15", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.65, + "output": 3.25, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen/qwen-plus", + "name": "Qwen: Qwen-Plus", + "display_name": "Qwen: Qwen-Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -125944,115 +130377,70 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": 
{ - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 1.2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "qwen/qwen3-coder-30b-a3b-instruct", + "name": "Qwen: Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen: Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 160000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - 
"release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-07-31", + "last_updated": "2025-07-31", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.03 + "input": 0.07, + "output": 0.27 }, "type": "chat" }, { - "id": "ministral-3b", - "name": "Ministral 3B", - "display_name": "Ministral 3B", + "id": "qwen/qwen3-32b", + "name": "Qwen: Qwen3 32B", + "display_name": "Qwen: Qwen3 32B", "modalities": { "input": [ "text" @@ -126062,64 +130450,75 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 40960, + "output": 40960 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-03", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2024-12-01", + "last_updated": "2026-02-04", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "gpt-4-turbo-vision", - "name": "GPT-4 Turbo Vision", - "display_name": "GPT-4 Turbo Vision", + "id": "qwen/qwen3-next-80b-a3b-instruct", + "name": "Qwen: Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen: Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "attachment": false, + "open_weights": true, + "release_date": "2025-09-11", + "last_updated": "2026-03-15", 
"cost": { - "input": 10, - "output": 30 + "input": 0.09, + "output": 1.1 }, "type": "chat" }, { - "id": "meta-llama-3.1-405b-instruct", - "name": "Meta-Llama-3.1-405B-Instruct", - "display_name": "Meta-Llama-3.1-405B-Instruct", + "id": "qwen/qwen3-vl-8b-instruct", + "name": "Qwen: Qwen3 VL 8B Instruct", + "display_name": "Qwen: Qwen3 VL 8B Instruct", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -126127,7 +130526,7 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, @@ -126135,161 +130534,161 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 5.33, - "output": 16 + "input": 0.08, + "output": 0.5 }, "type": "chat" }, { - "id": "gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "qwen/qwen3.6-35b-a3b", + "name": "Qwen: Qwen3.6 35B A3B", + "display_name": "Qwen: Qwen3.6 35B A3B", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-24", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.1612, + "output": 0.96525, + "cache_read": 0.1612 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "GPT-4o", - 
"display_name": "GPT-4o", + "id": "qwen/qwen3.7-max", + "name": "Qwen: Qwen3.7 Max", + "display_name": "Qwen: Qwen3.7 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-08-26", + "last_updated": "2026-05-27", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 1.625, + "output": 4.875, + "cache_read": 0.1625, + "cache_write": 2.03125 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "qwen/qwen3-max", + "name": "Qwen: Qwen3 Max", + "display_name": "Qwen: Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-09-05", + 
"last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.125 + "input": 1.2, + "output": 6, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "qwen/qwen3-8b", + "name": "Qwen: Qwen3 8B", + "display_name": "Qwen: Qwen3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 40960, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -126298,54 +130697,86 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.05, + "output": 0.4, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "qwen/qwen-plus-2025-07-28", + "name": "Qwen: Qwen Plus 0728", + "display_name": "Qwen: Qwen Plus 0728", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + 
] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-09-09", + "last_updated": "2026-03-15", + "cost": { + "input": 0.26, + "output": 0.78 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3.5-flash-02-23", + "name": "Qwen: Qwen3.5-Flash", + "display_name": "Qwen: Qwen3.5-Flash", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -126354,33 +130785,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "phi-3-medium-128k-instruct", - "name": "Phi-3-medium-instruct (128k)", - "display_name": "Phi-3-medium-instruct (128k)", + "id": "qwen/qwen3-30b-a3b-instruct-2507", + "name": "Qwen: Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen: Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -126390,8 +130816,40 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 262144 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-07-29", + "last_updated": "2026-03-15", + "cost": { + "input": 0.09, + "output": 0.3, + "cache_read": 0.04 + }, + 
"type": "chat" + }, + { + "id": "qwen/qwen-2.5-coder-32b-instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": false, @@ -126400,19 +130858,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-11-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.2, + "output": 0.2, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen: Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen: Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -126423,28 +130881,39 @@ }, "limit": { "context": 131072, - "output": 131072 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "release_date": "2025-09-11", + "last_updated": "2026-03-15", "cost": { - "input": 1.14, - "output": 4.56 + "input": 0.0975, + "output": 0.78 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "qwen/qwen3-235b-a22b-thinking-2507", + "name": "Qwen: Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen: Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -126476,20 +130945,18 @@ }, "attachment": false, 
"open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-12-02", + "release_date": "2025-07-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.11, + "output": 0.6 }, "type": "chat" }, { - "id": "mistral-small-2503", - "name": "Mistral Small 3.1", - "display_name": "Mistral Small 3.1", + "id": "qwen/qwen3-vl-32b-instruct", + "name": "Qwen: Qwen3 VL 32B Instruct", + "display_name": "Qwen: Qwen3 VL 32B Instruct", "modalities": { "input": [ "text", @@ -126500,7 +130967,7 @@ ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, @@ -126510,19 +130977,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "release_date": "2025-10-21", + "last_updated": "2025-11-25", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.104, + "output": 0.416 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "qwen/qwen3-coder", + "name": "Qwen: Qwen3 Coder 480B A35B", + "display_name": "Qwen: Qwen3 Coder 480B A35B", "modalities": { "input": [ "text" @@ -126532,41 +130998,44 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 262144, + "output": 52429 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.02, - "output": 0 + "input": 0.22, + "output": 1, + "cache_read": 0.022 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "qwen/qwen3.6-flash", + "name": "Qwen: Qwen3.6 Flash", + "display_name": "Qwen: 
Qwen3.6 Flash", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -126575,112 +131044,119 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.13 + "input": 0.25, + "output": 1.5, + "cache_write": 0.3125 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "qwen/qwen3.5-plus-02-15", + "name": "Qwen: Qwen3.5 Plus 2026-02-15", + "display_name": "Qwen: Qwen3.5 Plus 2026-02-15", "modalities": { "input": [ - "text", "image", - "pdf" + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", 
- "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.26, + "output": 1.56 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "display_name": "Qwen: Qwen2.5 7B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 32768, + "output": 6554 }, - "temperature": false, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2024-09", + "last_updated": "2025-04-16", + "cost": { + "input": 0.04, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "qwen/qwen3-vl-8b-thinking", + "name": "Qwen: Qwen3 VL 8B Thinking", + "display_name": "Qwen: Qwen3 VL 8B Thinking", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -126689,86 +131165,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - 
"release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-10-15", + "last_updated": "2025-11-25", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.117, + "output": 1.365 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen/qwen3-max-thinking", + "name": "Qwen: Qwen3 Max Thinking", + "display_name": "Qwen: Qwen3 Max Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, + "context": 262144, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.78, + "output": 3.9 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen: Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -126778,8 +131239,8 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 6554 }, "temperature": true, "tool_call": true, @@ -126789,26 +131250,32 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.051, + "output": 0.34 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "qwen/qwen2.5-vl-72b-instruct", + "name": "Qwen: Qwen2.5 VL 72B Instruct", + "display_name": "Qwen: Qwen2.5 VL 72B Instruct", "modalities": { "input": [ + "image", "text" ], "output": [ @@ -126816,41 +131283,44 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "attachment": true, + "open_weights": true, + "release_date": "2025-02-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0 + "input": 0.8, + "output": 0.8, + "cache_read": 0.075 }, - "type": "embedding" + "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "qwen/qwen3.5-27b", + "name": "Qwen: Qwen3.5-27B", + "display_name": "Qwen: Qwen3.5-27B", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -126859,107 +131329,72 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.195, + "output": 1.56 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen: Qwen3 235B A22B", + "display_name": "Qwen: Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.455, + "output": 1.82, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - 
"display_name": "o3-mini", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ "text" @@ -126969,45 +131404,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2024-09", + "last_updated": "2026-01-10", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.12, + "output": 0.39 }, "type": "chat" }, { - "id": "phi-4-reasoning", - "name": "Phi-4-reasoning", - "display_name": "Phi-4-reasoning", + "id": "qwen/qwen-plus-2025-07-28:thinking", + "name": "Qwen: Qwen Plus 0728 (thinking)", + "display_name": "Qwen: Qwen Plus 0728 (thinking)", "modalities": { "input": [ "text" @@ -127017,30 +131435,29 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 1000000, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-09-09", + "last_updated": "2026-03-15", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.26, + "output": 0.78 }, "type": "chat" }, { - "id": "phi-4", - "name": "Phi-4", - "display_name": "Phi-4", + "id": "qwen/qwen3-coder-next", + "name": "Qwen: Qwen3 Coder Next", + "display_name": "Qwen: Qwen3 Coder Next", 
"modalities": { "input": [ "text" @@ -127050,44 +131467,44 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-02-02", + "last_updated": "2026-03-15", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.12, + "output": 0.75, + "cache_read": 0.035 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "qwen/qwen3.6-27b", + "name": "Qwen: Qwen3.6 27B", + "display_name": "Qwen: Qwen3.6 27B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 256000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -127096,100 +131513,86 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.325, + "output": 3.25 }, "type": 
"chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen/qwen3.5-35b-a3b", + "name": "Qwen: Qwen3.5-35B-A3B", + "display_name": "Qwen: Qwen3.5-35B-A3B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.1625, + "output": 1.3 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "qwen/qwen3.5-9b", + "name": "Qwen: Qwen3.5-9B", + "display_name": "Qwen: Qwen3.5-9B", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -127200,66 +131603,84 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-03-10", + "last_updated": "2026-03-15", "cost": { - "input": 0.95, - "output": 4 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "gpt-4-32k", - "name": 
"GPT-4 32K", - "display_name": "GPT-4 32K", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen: Qwen3.5 397B A17B", + "display_name": "Qwen: Qwen3.5 397B A17B", "modalities": { "input": [ - "text" + "image", + "text", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "release_date": "2026-02-15", + "last_updated": "2026-03-15", "cost": { - "input": 60, - "output": 120 + "input": 0.39, + "output": 2.34 }, "type": "chat" }, { - "id": "meta-llama-3.1-8b-instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "qwen/qwen3-vl-30b-a3b-instruct", + "name": "Qwen: Qwen3 VL 30B A3B Instruct", + "display_name": "Qwen: Qwen3 VL 30B A3B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 32768 }, "temperature": true, @@ -127267,54 +131688,52 @@ "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-10-05", + "last_updated": "2025-11-25", "cost": { - "input": 0.3, - "output": 0.61 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "qwen/qwen3-235b-a22b-2507", + "name": "Qwen: Qwen3 
235B A22B Instruct 2507", + "display_name": "Qwen: Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2025-04", + "last_updated": "2026-01", "cost": { - "input": 0.2, - "output": 0.78 + "input": 0.071, + "output": 0.1 }, "type": "chat" }, { - "id": "phi-3-mini-128k-instruct", - "name": "Phi-3-mini-instruct (128k)", - "display_name": "Phi-3-mini-instruct (128k)", + "id": "qwen/qwen3-coder-flash", + "name": "Qwen: Qwen3 Coder Flash", + "display_name": "Qwen: Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -127324,29 +131743,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2025-07-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.195, + "output": 0.975, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "phi-3-small-128k-instruct", - "name": "Phi-3-small-instruct (128k)", - "display_name": "Phi-3-small-instruct (128k)", + "id": "qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "display_name": "Qwen: Qwen3 14B", "modalities": { "input": [ "text" @@ -127356,134 +131775,131 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 40960, + "output": 40960 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.06, + "output": 0.24, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "phi-4-mini", - "name": "Phi-4-mini", - "display_name": "Phi-4-mini", + "id": "qwen/qwen3-vl-235b-a22b-instruct", + "name": "Qwen: Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen: Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 52429 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-09-23", + "last_updated": "2026-01-10", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.2, + "output": 0.88, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "qwen/qwen3-30b-a3b", + "name": "Qwen: Qwen3 30B A3B", + "display_name": "Qwen: Qwen3 30B A3B", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 40960, + "output": 40960 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": 
false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "attachment": false, + "open_weights": true, + "release_date": "2025-04", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.08, + "output": 0.28, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "qwen/qwen3.6-max-preview", + "name": "Qwen: Qwen3.6 Max Preview", + "display_name": "Qwen: Qwen3.6 Max Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -127492,188 +131908,184 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-04-27", + "last_updated": "2026-05-01", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.01 + "input": 1.04, + "output": 6.24, + 
"cache_write": 1.3 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "qwen/qwen3.5-122b-a10b", + "name": "Qwen: Qwen3.5-122B-A10B", + "display_name": "Qwen: Qwen3.5-122B-A10B", "modalities": { "input": [ + "image", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2026-02-26", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.26, + "output": 2.08 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "qwen/qwen3.6-plus", + "name": "Qwen: Qwen3.6 Plus", + "display_name": "Qwen: Qwen3.6 Plus", "modalities": { "input": [ - "text", "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 
beta header for this model family." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-08-26", + "last_updated": "2026-04-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.325, + "output": 1.95, + "cache_read": 0.0325, + "cache_write": 0.40625 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "amazon/nova-lite-v1", + "name": "Amazon: Nova Lite 1.0", + "display_name": "Amazon: Nova Lite 1.0", "modalities": { "input": [ - "text", - "image" + "image", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 300000, + "output": 5120 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": true, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.06, + "output": 0.24 + }, + "type": "chat" + }, + { + "id": "amazon/nova-premier-v1", + "name": "Amazon: Nova Premier 1.0", + "display_name": "Amazon: Nova Premier 1.0", + "modalities": { + "input": [ + "image", + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 32000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2025-11-01", + 
"last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 2.5, + "output": 12.5 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "Grok 4 Fast (Reasoning)", - "display_name": "Grok 4 Fast (Reasoning)", + "id": "amazon/nova-pro-v1", + "name": "Amazon: Nova Pro 1.0", + "display_name": "Amazon: Nova Pro 1.0", "modalities": { "input": [ "text", @@ -127684,92 +132096,94 @@ ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 300000, + "output": 5120 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "amazon/nova-micro-v1", + "name": "Amazon: Nova Micro 1.0", + "display_name": "Amazon: Nova Micro 1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 5120 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2026-03-15", + "cost": { + "input": 0.035, + "output": 0.14 + }, + "type": "chat" + }, + { + "id": "amazon/nova-2-lite-v1", + "name": "Amazon: Nova 2 Lite", + "display_name": "Amazon: Nova 2 Lite", "modalities": { "input": [ + "image", + "pdf", "text", - "image" + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 65535 }, - "temperature": false, + 
"temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "AionLabs: Aion-RP 1.0 (8B)", + "display_name": "AionLabs: Aion-RP 1.0 (8B)", "modalities": { "input": [ "text" @@ -127779,27 +132193,28 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 32768, + "output": 32768 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0 + "input": 0.8, + "output": 1.6 }, - "type": "embedding" + "type": "chat" }, { - "id": "phi-4-reasoning-plus", - "name": "Phi-4-reasoning-plus", - "display_name": "Phi-4-reasoning-plus", + "id": "aion-labs/aion-1.0-mini", + "name": "AionLabs: Aion-1.0-Mini", + "display_name": "AionLabs: Aion-1.0-Mini", "modalities": { "input": [ "text" @@ -127809,8 +132224,8 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -127819,53 +132234,51 @@ 
"default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "open_weights": false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.125, - "output": 0.5 + "input": 0.7, + "output": 1.4 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "aion-labs/aion-2.0", + "name": "AionLabs: Aion-2.0", + "display_name": "AionLabs: Aion-2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "release_date": "2026-02-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "aion-labs/aion-1.0", + "name": "AionLabs: Aion-1.0", + "display_name": "AionLabs: Aion-1.0", "modalities": { "input": [ "text" @@ -127875,8 +132288,8 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": false, @@ -127884,98 +132297,82 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": 
false, + "release_date": "2025-02-05", + "last_updated": "2026-03-15", "cost": { - "input": 1.35, - "output": 5.4 + "input": 4, + "output": 8 }, "type": "chat" }, { - "id": "mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "inflection/inflection-3-pi", + "name": "Inflection: Inflection 3 Pi", + "display_name": "Inflection: Inflection 3 Pi", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.4, - "output": 2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "inflection/inflection-3-productivity", + "name": "Inflection: Inflection 3 Productivity", + "display_name": "Inflection: Inflection 3 Productivity", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 8000, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2026-03-15", "cost": { - "input": 0.25, - "output": 1 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "cohere-command-r-plus-08-2024", - "name": "Command R+", - "display_name": 
"Command R+", + "id": "sao10k/l3.1-euryale-70b", + "name": "Sao10K: Llama 3.1 Euryale 70B v2.2", + "display_name": "Sao10K: Llama 3.1 Euryale 70B v2.2", "modalities": { "input": [ "text" @@ -127985,8 +132382,8 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -127995,53 +132392,49 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2024-08-28", + "last_updated": "2026-03-15", "cost": { - "input": 2.5, - "output": 10 + "input": 0.85, + "output": 0.85 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "sao10k/l3.3-euryale-70b", + "name": "Sao10K: Llama 3.3 Euryale 70B", + "display_name": "Sao10K: Llama 3.3 Euryale 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 131072, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2024-12-18", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.65, + "output": 0.75 }, "type": "chat" }, { - "id": "phi-3-small-8k-instruct", - "name": "Phi-3-small-instruct (8k)", - "display_name": "Phi-3-small-instruct (8k)", + "id": "sao10k/l3-lunaris-8b", + "name": "Sao10K: Llama 3 8B Lunaris", + "display_name": "Sao10K: Llama 3 8B Lunaris", "modalities": { "input": [ "text" @@ -128052,7 +132445,7 @@ }, "limit": { "context": 8192, - "output": 2048 + "output": 8192 }, "temperature": true, "tool_call": false, @@ -128061,19 +132454,18 @@ }, "attachment": false, "open_weights": 
true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2024-08-13", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.04, + "output": 0.05 }, "type": "chat" }, { - "id": "meta-llama-3-8b-instruct", - "name": "Meta-Llama-3-8B-Instruct", - "display_name": "Meta-Llama-3-8B-Instruct", + "id": "sao10k/l3-euryale-70b", + "name": "Sao10k: Llama 3 Euryale 70B v2.1", + "display_name": "Sao10k: Llama 3 Euryale 70B v2.1", "modalities": { "input": [ "text" @@ -128084,86 +132476,58 @@ }, "limit": { "context": 8192, - "output": 2048 + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2024-06-18", + "last_updated": "2026-03-15", "cost": { - "input": 0.3, - "output": 0.61 + "input": 1.48, + "output": 1.48 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": "sao10k/l3.1-70b-hanami-x1", + "name": "Sao10K: Llama 3.1 70B Hanami x1", + "display_name": "Sao10K: Llama 3.1 70B Hanami x1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 16000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - 
"knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-08", + "last_updated": "2026-03-15", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "phi-3.5-mini-instruct", - "name": "Phi-3.5-mini-instruct", - "display_name": "Phi-3.5-mini-instruct", + "id": "upstage/solar-pro-3", + "name": "Upstage: Solar Pro 3", + "display_name": "Upstage: Solar Pro 3", "modalities": { "input": [ "text" @@ -128174,28 +132538,28 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "open_weights": false, + "release_date": "2026-01-27", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "cohere-embed-v3-english", - "name": "Embed v3 English", - "display_name": "Embed v3 English", + "id": "allenai/olmo-3-32b-think", + "name": "AllenAI: Olmo 3 32B Think", + "display_name": "AllenAI: Olmo 3 32B Think", "modalities": { "input": [ "text" @@ -128205,28 +132569,29 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 65536, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "release_date": "2025-11-22", + "last_updated": "2026-03-15", "cost": { - "input": 0.1, - "output": 0 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "phi-3-mini-4k-instruct", - "name": "Phi-3-mini-instruct (4k)", - 
"display_name": "Phi-3-mini-instruct (4k)", + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "display_name": "EssentialAI: Rnj 1 Instruct", "modalities": { "input": [ "text" @@ -128236,29 +132601,28 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 32768, + "output": 6554 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "release_date": "2025-12-05", + "last_updated": "2026-03-15", "cost": { - "input": 0.13, - "output": 0.52 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "meta-llama-3.1-70b-instruct", - "name": "Meta-Llama-3.1-70B-Instruct", - "display_name": "Meta-Llama-3.1-70B-Instruct", + "id": "deepseek/deepseek-r1-0528", + "name": "DeepSeek: R1 0528", + "display_name": "DeepSeek: R1 0528", "modalities": { "input": [ "text" @@ -128268,29 +132632,41 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2025-05-28", + "last_updated": "2026-03-15", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.45, + "output": 2.15, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "phi-3-medium-4k-instruct", - "name": "Phi-3-medium-instruct (4k)", - "display_name": "Phi-3-medium-instruct (4k)", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek: DeepSeek V4 Flash", + "display_name": "DeepSeek: DeepSeek V4 Flash", 
"modalities": { "input": [ "text" @@ -128300,29 +132676,41 @@ ] }, "limit": { - "context": 4096, - "output": 1024 + "context": 1048576, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-04-23", - "last_updated": "2024-04-23", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.17, - "output": 0.68 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "deepseek-v3.2-speciale", - "name": "DeepSeek-V3.2-Speciale", - "display_name": "DeepSeek-V3.2-Speciale", + "id": "deepseek/deepseek-v3.1-terminus", + "name": "DeepSeek: DeepSeek V3.1 Terminus", + "display_name": "DeepSeek: DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -128332,121 +132720,112 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 163840, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.21, + "output": 0.79, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "deepseek/deepseek-r1-distill-llama-70b", + "name": "DeepSeek: R1 Distill Llama 70B", + "display_name": "DeepSeek: R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ 
"text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "open_weights": true, + "release_date": "2025-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.7, + "output": 0.8, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "phi-4-multimodal", - "name": "Phi-4-multimodal", - "display_name": "Phi-4-multimodal", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek: DeepSeek V4 Pro", + "display_name": "DeepSeek: DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 384000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-05-01", "cost": { - "input": 0.08, - "output": 0.32, - "input_audio": 4 + 
"input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0125", - "name": "GPT-3.5 Turbo 0125", - "display_name": "GPT-3.5 Turbo 0125", + "id": "deepseek/deepseek-r1", + "name": "DeepSeek: R1", + "display_name": "DeepSeek: R1", "modalities": { "input": [ "text" @@ -128456,62 +132835,73 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 64000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.7, + "output": 2.5 }, "type": "chat" }, { - "id": "llama-3.2-11b-vision-instruct", - "name": "Llama-3.2-11B-Vision-Instruct", - "display_name": "Llama-3.2-11B-Vision-Instruct", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek: DeepSeek V3.2 Speciale", + "display_name": "DeepSeek: DeepSeek V3.2 Speciale", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 0.37, - "output": 0.37 + "input": 0.4, + "output": 1.2, + "cache_read": 0.135 
}, "type": "chat" }, { - "id": "phi-3.5-moe-instruct", - "name": "Phi-3.5-MoE-instruct", - "display_name": "Phi-3.5-MoE-instruct", + "id": "deepseek/deepseek-v3.2-exp", + "name": "DeepSeek: DeepSeek V3.2 Exp", + "display_name": "DeepSeek: DeepSeek V3.2 Exp", "modalities": { "input": [ "text" @@ -128521,29 +132911,29 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-08-20", - "last_updated": "2024-08-20", + "release_date": "2025-01-01", + "last_updated": "2025-09-29", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.27, + "output": 0.41 }, "type": "chat" }, { - "id": "cohere-command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "deepseek/deepseek-chat-v3-0324", + "name": "DeepSeek: DeepSeek V3 0324", + "display_name": "DeepSeek: DeepSeek V3 0324", "modalities": { "input": [ "text" @@ -128553,64 +132943,62 @@ ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "release_date": "2025-03-24", + "last_updated": "2026-03-15", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.2, + "output": 0.77, + "cache_read": 0.095 }, "type": "chat" }, { - "id": "gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "deepseek/deepseek-r1-distill-qwen-32b", + "name": "DeepSeek: R1 Distill Qwen 32B", + "display_name": "DeepSeek: R1 Distill Qwen 32B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - 
"context": 128000, - "output": 16384 + "context": 32768, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-01-01", + "last_updated": "2025-11-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.29, + "output": 0.29 }, "type": "chat" }, { - "id": "meta-llama-3-70b-instruct", - "name": "Meta-Llama-3-70B-Instruct", - "display_name": "Meta-Llama-3-70B-Instruct", + "id": "deepseek/deepseek-chat", + "name": "DeepSeek: DeepSeek V3", + "display_name": "DeepSeek: DeepSeek V3", "modalities": { "input": [ "text" @@ -128620,29 +133008,29 @@ ] }, "limit": { - "context": 8192, - "output": 2048 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-04-18", - "last_updated": "2024-04-18", + "release_date": "2024-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 2.68, - "output": 3.54 + "input": 0.32, + "output": 0.89, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "grok-4-20-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek: DeepSeek V3.2", + "display_name": "DeepSeek: DeepSeek V3.2", "modalities": { "input": [ "text" @@ -128652,8 +133040,8 @@ ] }, "limit": { - "context": 262000, - "output": 8192 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -128667,20 +133055,20 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + 
"open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2026-03-15", "cost": { - "input": 2, - "output": 6 + "input": 0.26, + "output": 0.38, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "deepseek/deepseek-chat-v3.1", + "name": "DeepSeek: DeepSeek V3.1", + "display_name": "DeepSeek: DeepSeek V3.1", "modalities": { "input": [ "text" @@ -128690,43 +133078,42 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 32768, + "output": 7168 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-09-21", - "last_updated": "2023-09-21", + "open_weights": true, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 1.5, - "output": 2 + "input": 0.15, + "output": 0.75 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "minimax/minimax-m2.5", + "name": "MiniMax: MiniMax M2.5", + "display_name": "MiniMax: MiniMax M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -128734,41 +133121,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", 
- "last_updated": "2026-01-14", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-03-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 1.2, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek-V4-Flash", - "display_name": "DeepSeek-V4-Flash", + "id": "minimax/minimax-m2.1", + "name": "MiniMax: MiniMax M2.1", + "display_name": "MiniMax: MiniMax M2.1", "modalities": { "input": [ "text" @@ -128778,148 +133148,105 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 196608, + "output": 39322 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.74, - "output": 3.48 + "input": 0.27, + "output": 0.95, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "o1-mini", - "name": "o1-mini", - "display_name": "o1-mini", + "id": "minimax/minimax-01", + "name": "MiniMax: MiniMax-01", + "display_name": "MiniMax: MiniMax-01", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 1000192, + "output": 1000192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + 
"supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-09-12", - "last_updated": "2024-09-12", + "attachment": true, + "open_weights": true, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.2, + "output": 1.1 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "minimax/minimax-m2", + "name": "MiniMax: MiniMax M2", + "display_name": "MiniMax: MiniMax M2", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 196608 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "open_weights": true, + "release_date": "2025-10-23", + "last_updated": "2026-03-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.255, + "output": 1, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "phi-4-mini-reasoning", - "name": "Phi-4-mini-reasoning", - "display_name": "Phi-4-mini-reasoning", + "id": "minimax/minimax-m2-her", + "name": "MiniMax: MiniMax M2-her", + "display_name": "MiniMax: MiniMax M2-her", "modalities": { "input": [ "text" @@ -128929,68 +133256,72 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, 
+ "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.1-chat", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "minimax/minimax-m2.7", + "name": "MiniMax: MiniMax M2.7", + "display_name": "MiniMax: MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ - "text", - "image", - "audio" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-14", - "last_updated": "2025-11-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0613", - "name": "GPT-3.5 Turbo 0613", - "display_name": "GPT-3.5 Turbo 0613", + "id": "minimax/minimax-m1", + "name": "MiniMax: MiniMax M1", + "display_name": "MiniMax: MiniMax M1", "modalities": { "input": [ "text" @@ -129000,44 +133331,44 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 1000000, + "output": 40000 }, "temperature": true, - "tool_call": false, + "tool_call": 
true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-06-13", - "last_updated": "2023-06-13", + "open_weights": true, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 3, - "output": 4 + "input": 0.4, + "output": 2.2 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "stealth/claude-opus-4.7", + "name": "Stealth: Claude Opus 4.7 (20% off)", + "display_name": "Stealth: Claude Opus 4.7 (20% off)", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -129047,55 +133378,59 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-04-16", + "last_updated": "2026-05-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 4, + "output": 20, + "cache_read": 0.4, + "cache_write": 5 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "stealth/claude-sonnet-4.6", + "name": "Stealth: Claude Sonnet 4.6 (20% off)", + "display_name": "Stealth: Claude Sonnet 4.6 (20% off)", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -129105,85 +133440,58 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", - "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2026-02-17", + "last_updated": "2026-05-27", "cost": { - "input": 10, - "output": 30 + "input": 2.4, + "output": 12, + "cache_read": 0.24, + "cache_write": 3 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "stealth/claude-opus-4.6", + "name": "Stealth: Claude Opus 4.6 (20% off)", + "display_name": "Stealth: Claude Opus 4.6 (20% off)", "modalities": { "input": [ - "text", "image", - "pdf" + "pdf", + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 1000000, "output": 128000 }, "temperature": true, @@ -129222,39 +133530,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "last_updated": "2026-05-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25, - "tiers": [ - { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 37.5, - "cache_read": 1, - "cache_write": 12.5 - } + "input": 4, + "output": 20, + "cache_read": 0.4, + "cache_write": 5 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": 
"Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "Kwaipilot: KAT-Coder-Pro V2", + "display_name": "Kwaipilot: KAT-Coder-Pro V2", "modalities": { "input": [ "text" @@ -129264,8 +133553,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 256000, + "output": 80000 }, "temperature": true, "tool_call": true, @@ -129274,52 +133563,50 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-03-27", + "last_updated": "2026-04-11", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "llama-3.2-90b-vision-instruct", - "name": "Llama-3.2-90B-Vision-Instruct", - "display_name": "Llama-3.2-90B-Vision-Instruct", + "id": "nousresearch/hermes-2-pro-llama-3-8b", + "name": "NousResearch: Hermes 2 Pro - Llama-3 8B", + "display_name": "NousResearch: Hermes 2 Pro - Llama-3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2024-05-27", + "last_updated": "2024-06-27", "cost": { - "input": 2.04, - "output": 2.04 + "input": 0.14, + "output": 0.14 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "GPT-3.5 Turbo 0301", - "display_name": "GPT-3.5 Turbo 0301", + "id": "nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "display_name": "Nous: Hermes 4 405B", "modalities": { "input": [ "text" @@ -129329,78 +133616,60 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 131072, + "output": 26215 }, 
"temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2021-08", - "release_date": "2023-03-01", - "last_updated": "2023-03-01", + "open_weights": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 1.5, - "output": 2 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": "nousresearch/hermes-3-llama-3.1-70b", + "name": "Nous: Hermes 3 70B Instruct", + "display_name": "Nous: Hermes 3 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "open_weights": true, + "release_date": "2024-08-18", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek-V4-Pro", - "display_name": "DeepSeek-V4-Pro", + "id": "nousresearch/hermes-3-llama-3.1-405b", + "name": "Nous: Hermes 3 405B Instruct", + "display_name": "Nous: Hermes 3 405B Instruct", "modalities": { "input": [ "text" @@ -129410,86 +133679,70 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": false, "reasoning": { - "supported": 
true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2024-08-16", + "last_updated": "2024-08-16", "cost": { - "input": 0.19, - "output": 0.51 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "display_name": "Nous: Hermes 4 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2025-08-25", + "last_updated": "2026-03-15", "cost": { - "input": 0.6, - "output": 3 + "input": 0.13, + "output": 0.4, + "cache_read": 0.055 }, "type": "chat" - }, + } + ] + }, + "lucidquery": { + "id": "lucidquery", + "name": "LucidQuery AI", + "display_name": "LucidQuery AI", + "api": "https://lucidquery.com/api/v1", + "doc": "https://lucidquery.com/api/docs", + "models": [ { - "id": "codex-mini", - "name": "Codex Mini", - "display_name": "Codex Mini", + "id": "lucidnova-rf1-100b", + "name": "LucidNova RF1 100B", + "display_name": "LucidNova RF1 100B", "modalities": { "input": [ "text" @@ -129499,8 +133752,8 @@ ] }, "limit": { - "context": 
200000, - "output": 100000 + "context": 120000, + "output": 8000 }, "temperature": false, "tool_call": true, @@ -129510,20 +133763,19 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-05-16", - "last_updated": "2025-05-16", + "knowledge": "2025-09-16", + "release_date": "2024-12-28", + "last_updated": "2025-09-10", "cost": { - "input": 1.5, - "output": 6, - "cache_read": 0.375 + "input": 2, + "output": 5 }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "lucidquery-nexus-coder", + "name": "LucidQuery Nexus Coder", + "display_name": "LucidQuery Nexus Coder", "modalities": { "input": [ "text" @@ -129533,30 +133785,70 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 250000, + "output": 60000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-01", + "release_date": "2025-09-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 5 + }, + "type": "chat" + } + ] + }, + "meganova": { + "id": "meganova", + "name": "Meganova", + "display_name": "Meganova", + "api": "https://api.meganova.ai/v1", + "doc": "https://docs.meganova.ai", + "models": [ + { + "id": "meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 16384 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.56, - "output": 1.68 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { 
- "id": "cohere-command-a", - "name": "Command A", - "display_name": "Command A", + "id": "moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -129566,8 +133858,8 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -129575,53 +133867,77 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.6, + "output": 2.6 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-03-14", - "last_updated": "2023-03-14", + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 60, - "output": 120 + "input": 0.45, + "output": 2.8 }, "type": "chat" }, { - "id": "gpt-5.3-chat", - "name": "GPT-5.3 Chat", - 
"display_name": "GPT-5.3 Chat", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -129632,43 +133948,41 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "Grok 4.1 Fast (Reasoning)", - "display_name": "Grok 4.1 Fast (Reasoning)", + "id": "Qwen/Qwen3.5-Plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -129678,24 +133992,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-06-27", - "last_updated": "2025-06-27", + "knowledge": "2025-04", + "release_date": "2026-02", + "last_updated": "2026-02", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.4, + "output": 2.4, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "codestral-2501", - "name": "Codestral 25.01", - "display_name": "Codestral 25.01", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + 
"display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -129705,8 +134026,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -129714,20 +134035,19 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-03", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.09, + "output": 0.6 }, "type": "chat" }, { - "id": "grok-4-20-non-reasoning", - "name": "Grok 4.20 (Non-Reasoning)", - "display_name": "Grok 4.20 (Non-Reasoning)", + "id": "XiaomiMiMo/MiMo-V2-Flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ "text" @@ -129737,34 +134057,30 @@ ] }, "limit": { - "context": 262000, - "output": 8192 + "context": 262144, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24B Instruct", + "display_name": "Mistral Small 3.2 24B Instruct", "modalities": { "input": [ "text", @@ -129775,8 +134091,8 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -129784,21 +134100,20 @@ 
"supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-06-20", + "last_updated": "2025-06-20", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "cohere-embed-v3-multilingual", - "name": "Embed v3 Multilingual", - "display_name": "Embed v3 Multilingual", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ "text" @@ -129808,69 +134123,72 @@ ] }, "limit": { - "context": 512, - "output": 1024 + "context": 131072, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2023-11-07", - "last_updated": "2023-11-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.1, - "output": 0 + "input": 0.02, + "output": 0.04 }, "type": "chat" }, { - "id": "cohere-embed-v-4-0", - "name": "Embed v4", - "display_name": "Embed v4", + "id": "zai-org/GLM-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 1536 + "context": 202752, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-04-15", - "last_updated": 
"2025-04-15", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.12, - "output": 0 + "input": 0.45, + "output": 1.9 }, "type": "chat" - } - ] - }, - "atomic-chat": { - "id": "atomic-chat", - "name": "Atomic Chat", - "display_name": "Atomic Chat", - "api": "http://127.0.0.1:1337/v1", - "doc": "https://atomic.chat", - "models": [ + }, { - "id": "Meta-Llama-3_1-8B-Instruct-GGUF", - "name": "Meta Llama 3.1 8B Instruct (GGUF)", - "display_name": "Meta Llama 3.1 8B Instruct (GGUF)", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -129880,28 +134198,40 @@ ] }, "limit": { - "context": 131072, - "output": 4096 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0 + "input": 0.8, + "output": 2.56 }, "type": "chat" }, { - "id": "gemma-4-E4B-it-IQ4_XS", - "name": "Gemma 4 E4B Instruct (IQ4_XS)", - "display_name": "Gemma 4 E4B Instruct (IQ4_XS)", + "id": "zai-org/GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -129911,60 +134241,72 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 202752, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + 
"continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "Qwen3_5-9B-MLX-4bit", - "name": "Qwen 3.5 9B (MLX 4-bit)", - "display_name": "Qwen 3.5 9B (MLX 4-bit)", + "id": "deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 0324", + "display_name": "DeepSeek V3 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-03-05", - "last_updated": "2026-04-04", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0, - "output": 0 + "input": 0.25, + "output": 0.88 }, "type": "chat" }, { - "id": "gemma-4-E4B-it-MLX-4bit", - "name": "Gemma 4 E4B Instruct (MLX 4-bit)", - "display_name": "Gemma 4 E4B Instruct (MLX 4-bit)", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ "text" @@ -129974,68 +134316,103 @@ ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 163840, + "output": 64000 }, "temperature": true, "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", + "cost": { + "input": 0.5, + "output": 2.15 + }, + "type": "chat" + 
}, + { + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 164000, + "output": 164000 + }, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-08-25", + "last_updated": "2025-08-25", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 1 }, "type": "chat" }, { - "id": "Qwen3_5-9B-Q4_K_M", - "name": "Qwen 3.5 9B (Q4_K_M)", - "display_name": "Qwen 3.5 9B (Q4_K_M)", + "id": "deepseek-ai/DeepSeek-V3.2-Exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 164000, + "output": 164000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-03-05", - "last_updated": "2026-04-04", + "release_date": "2025-10-10", + "last_updated": "2025-10-10", "cost": { - "input": 0, - "output": 0 + "input": 0.27, + "output": 0.4 }, "type": "chat" - } - ] - }, - "merge-gateway": { - "id": "merge-gateway", - "name": "Merge Gateway", - "display_name": "Merge Gateway", - "doc": "https://docs.merge.dev/merge-gateway", - "models": [ + }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -130045,8 +134422,44 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 164000, + "output": 164000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true + }, + 
"extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", + "cost": { + "input": 0.26, + "output": 0.38 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 196608, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -130067,20 +134480,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.28, + "output": 1.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -130090,8 +134501,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -130112,90 +134523,96 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.003625 + "input": 0.3, + "output": 1.2 + }, + "type": "chat" + } + ] + }, + "perplexity": { + "id": "perplexity", + "name": "Perplexity", + "display_name": "Perplexity", + "doc": "https://docs.perplexity.ai", + "models": [ + { + "id": "sonar-reasoning-pro", + "name": "Sonar Reasoning Pro", + "display_name": "Sonar Reasoning Pro", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + 
"context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", + "cost": { + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "sonar", + "name": "Sonar", + "display_name": "Sonar", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "sonar-pro", + "name": "Sonar Pro", + "display_name": "Sonar Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -130203,110 +134620,70 @@ }, "limit": { "context": 200000, - "output": 64000 + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-09-01", + "release_date": "2024-01-01", + "last_updated": "2025-09-01", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "sonar-deep-research", + "name": "Perplexity Sonar Deep Research", + "display_name": "Perplexity Sonar Deep Research", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "knowledge": "2025-01", + "release_date": "2025-02-01", + "last_updated": "2025-09-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 2, + "output": 8, + "reasoning": 3 }, "type": "chat" - }, + } + ] + }, + "amazon-bedrock": { + "id": "amazon-bedrock", + "name": "Amazon Bedrock", + "display_name": "Amazon Bedrock", + "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", + "models": [ { - "id": "anthropic/claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (Global)", + "display_name": "Claude Haiku 4.5 (Global)", "modalities": { "input": [ "text", @@ -130350,21 +134727,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (Global)", + "display_name": "Claude Sonnet 4.5 (Global)", "modalities": { "input": [ "text", @@ -130377,7 +134754,7 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -130408,143 +134785,86 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", 
+ "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "us.meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct (US)", + "display_name": "Llama 4 Scout 17B Instruct (US)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 3500000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "minimax.minimax-m2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 204608, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -130559,7 +134879,7 @@ "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -130569,35 +134889,33 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "high", "effort_options": [ "low", "medium", "high", + "xhigh", "max" ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 5, "output": 25, @@ -130607,9 +134925,9 @@ "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "eu.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (EU)", + "display_name": "Claude Sonnet 4.6 (EU)", "modalities": { "input": [ "text", @@ -130622,9 +134940,9 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -130634,187 +134952,59 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, "effort": "high", "effort_options": [ "low", "medium", "high", - "xhigh", "max" ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" ], "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" - }, - { - "id": "mistral/mistral-large-2411", - "name": "Mistral Large 2.1", - "display_name": "Mistral Large 2.1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", - "cost": { - "input": 2, - "output": 6 - }, - "type": "chat" - }, - { - "id": "mistral/mistral-medium-latest", - "name": "Mistral Medium (latest)", - "display_name": "Mistral Medium (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-08-12", - "last_updated": "2025-08-12", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "mistral/devstral-medium-latest", - "name": "Devstral 2 (latest)", - "display_name": "Devstral 2 (latest)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "mistral/mistral-large-2512", - "name": "Mistral Large 3", - "display_name": 
"Mistral Large 3", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.5, - "output": 1.5 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33, + "cache_write": 4.125 }, "type": "chat" }, { - "id": "mistral/mistral-large-latest", - "name": "Mistral Large (latest)", - "display_name": "Mistral Large (latest)", + "id": "mistral.voxtral-small-24b-2507", + "name": "Voxtral Small 24B 2507", + "display_name": "Voxtral Small 24B 2507", "modalities": { "input": [ "text", - "image" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -130823,19 +135013,18 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.15, + "output": 0.35 }, "type": "chat" }, { - "id": "mistral/mistral-medium-2505", - "name": "Mistral Medium 3", - "display_name": "Mistral Medium 3", + "id": "mistral.ministral-3-3b-instruct", + "name": "Ministral 3 3B", + "display_name": "Ministral 3 3B", "modalities": { "input": [ "text", @@ -130845,105 +135034,9 @@ "text" ] }, - "limit": { - "context": 131072, - "output": 131072 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", - "cost": { - "input": 
0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "mistral/devstral-small-2507", - "name": "Devstral Small", - "display_name": "Devstral Small", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", - "cost": { - "input": 0.1, - "output": 0.3 - }, - "type": "chat" - }, - { - "id": "mistral/devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", - "cost": { - "input": 0.4, - "output": 2 - }, - "type": "chat" - }, - { - "id": "mistral/codestral-latest", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, "limit": { "context": 256000, - "output": 4096 + "output": 8192 }, "temperature": true, "tool_call": true, @@ -130952,52 +135045,18 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", - "cost": { - "input": 0.3, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "mistral/pixtral-large-latest", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - 
"attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "mistral/magistral-medium-latest", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "openai.gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" @@ -131018,53 +135077,83 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 5 + "input": 0.07, + "output": 0.3 }, "type": "chat" }, { - "id": "mistral/mistral-small-latest", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", + "id": "anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.15, - "output": 0.6 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistral/devstral-medium-2507", - "name": "Devstral Medium", - "display_name": "Devstral Medium", + "id": "openai.gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ "text" @@ -131075,7 +135164,7 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, "temperature": true, "tool_call": true, @@ -131084,19 +135173,18 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-07-10", - "last_updated": "2025-07-10", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 0.4, - "output": 2 + "input": 0.07, + "output": 0.2 }, "type": "chat" }, { - "id": "xai/grok-4.20-0309-reasoning", - "name": "Grok 4.20 (Reasoning)", - "display_name": "Grok 4.20 (Reasoning)", + "id": "anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", @@ -131108,51 +135196,63 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + 
"notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-09", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "xai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "global.anthropic.claude-fable-5", + "name": "Claude Fable 5 (Global)", + "display_name": "Claude Fable 5 (Global)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -131160,9 +135260,9 @@ }, "limit": { "context": 1000000, - "output": 30000 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -131170,40 +135270,47 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2, - "tiers": [ - { - "input": 2.5, - "output": 5, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 5, - "cache_read": 0.4 - } + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "openai.gpt-oss-120b-1:0", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ "text" @@ -131214,92 +135321,121 @@ }, "limit": { "context": 128000, - "output": 4000 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2.5, - "output": 10 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "cohere/command-r-08-2024", - "name": "Command R", - "display_name": "Command R", + "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": 
"2024-08-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "cohere/command-r7b-12-2024", - "name": "Command R7B", - "display_name": "Command R7B", + "id": "amazon.nova-pro-v1:0", + "name": "Nova Pro", + "display_name": "Nova Pro", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-02-27", - "last_updated": "2024-02-27", + "attachment": true, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.0375, - "output": 0.15 + "input": 0.8, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "cohere/command-a-03-2025", - "name": "Command A", - "display_name": "Command A", + "id": "qwen.qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -131309,64 +135445,92 @@ ] }, "limit": { - "context": 256000, - "output": 8000 + "context": 131072, + "output": 65536 }, "temperature": true, 
"tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 2.5, - "output": 10 + "input": 0.22, + "output": 1.8 }, "type": "chat" }, { - "id": "zai/glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "us.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (US)", + "display_name": "Claude Opus 4.7 (US)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "zai/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "nvidia.nemotron-nano-9b-v2", + "name": "NVIDIA Nemotron Nano 9B v2", + "display_name": "NVIDIA Nemotron Nano 9B v2", "modalities": { "input": [ "text" @@ -131376,37 +135540,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.06, + "output": 0.23 }, "type": "chat" }, { - "id": "zai/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "qwen.qwen3-32b-v1:0", + "name": "Qwen3 32B (dense)", + "display_name": "Qwen3 32B (dense)", "modalities": { "input": [ "text" @@ -131416,8 +135571,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -131425,79 +135580,86 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": 
"2025-12-22", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "jp.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (JP)", + "display_name": "Claude Sonnet 4.6 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "zai/glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "deepseek.r1-v1:0", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -131507,8 +135669,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -131516,163 +135678,164 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "zai/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "mistral.mistral-large-3-675b-instruct", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 256000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": 
"2025-07-28", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "zai/glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "google.gemma-3-27b-it", + "name": "Google Gemma 3 27B Instruct", + "display_name": "Google Gemma 3 27B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 202752, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2025-07", + "release_date": "2025-07-27", + "last_updated": "2025-07-27", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.12, + "output": 0.2 }, "type": "chat" }, { - "id": "zai/glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with 
effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "amazon.nova-2-lite-v1:0", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ -131680,101 +135843,86 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.33, + "output": 2.75 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "openai.gpt-oss-safeguard-120b", + "name": "GPT OSS Safeguard 120B", + "display_name": "GPT OSS Safeguard 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16384 }, 
"temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-10-29", + "last_updated": "2025-10-29", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", "type": "chat" }, { - "id": "google/gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "mistral.ministral-3-8b-instruct", + "name": "Ministral 3 8B", + "display_name": "Ministral 3 8B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "eu.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (EU)", + "display_name": "Claude Opus 4.6 (EU)", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -131782,57 +135930,64 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": 
"high", - "level_options": [ - "minimal", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ "low", "medium", - "high" + "high", + "max" ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 5.5, + "output": 27.5, + "cache_read": 0.55, + "cache_write": 6.875 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "au.anthropic.claude-opus-4-6-v1", + "name": "AU Anthropic Claude Opus 4.6", + "display_name": "AU Anthropic Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -131840,79 +135995,71 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ "low", - "high" + "medium", + "high", + "max" ], + "interleaved": true, 
"summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "knowledge": "2025-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 16.5, + "output": 82.5, + "cache_read": 1.65, + "cache_write": 20.625 }, "type": "chat" }, { - "id": "google/gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "openai.gpt-oss-120b", + "name": "gpt-oss-120b", + "display_name": "gpt-oss-120b", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -131920,29 +136067,24 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "global.anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8 
(Global)", + "display_name": "Claude Opus 4.8 (Global)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -131950,143 +136092,94 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "us.meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct (US)", + "display_name": "Llama 4 Maverick 17B Instruct (US)", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.24, 
+ "output": 0.97 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "openai.gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ "text", "image", - "video", - "audio", "pdf" ], "output": [ @@ -132094,110 +136187,117 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-06-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 2.75, + "output": 16.5, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "mistral.devstral-2-123b", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-17", + "last_updated": "2026-02-17", + "cost": { + "input": 0.4, + "output": 2 + }, + "type": "chat" + }, + { + "id": "zai.glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { 
"supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "writer.palmyra-x4-v1:0", + "name": "Palmyra X4", + "display_name": "Palmyra X4", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 122880, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -132205,43 +136305,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 2.5, + "output": 10 }, "type": "chat" 
}, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "mistral.magistral-small-2509", + "name": "Magistral Small 1.2", + "display_name": "Magistral Small 1.2", "modalities": { "input": [ "text", @@ -132252,8 +136329,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 40000 }, "temperature": true, "tool_call": true, @@ -132261,145 +136338,85 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "qwen.qwen3-coder-480b-a35b-v1:0", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 131072, "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0.22, + "output": 1.8 }, 
"type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "amazon.nova-micro-v1:0", + "name": "Nova Micro", + "display_name": "Nova Micro", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.035, + "output": 0.14, + "cache_read": 0.00875 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "mistral.pixtral-large-2502-v1:0", + "name": "Pixtral Large (25.02)", + "display_name": "Pixtral Large (25.02)", "modalities": { "input": [ "text", @@ -132411,85 +136428,92 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - 
"last_updated": "2024-08-06", + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "us.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (US)", + "display_name": "Claude Opus 4.6 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "jp.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (JP)", + "display_name": "Claude Opus 4.7 (JP)", "modalities": { "input": [ "text", @@ -132501,44 +136525,73 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (AU)", + "display_name": "Claude Sonnet 4.5 (AU)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -132548,75 +136601,73 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "deepseek.v3-v1:0", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 81920 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", @@ -132629,78 +136680,110 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 
1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "openai/gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (JP)", + "display_name": "Claude Sonnet 4.5 (JP)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "google.gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", "modalities": { "input": [ "text", @@ -132712,98 +136795,97 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.04, + "output": 0.08 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (EU)", + "display_name": "Claude Sonnet 4.5 (EU)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "default_enabled": false, + 
"mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 3.3, + "output": 16.5, + "cache_read": 0.33, + "cache_write": 4.125 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "qwen.qwen3-vl-235b-a22b", + "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -132812,69 +136894,50 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-10-04", + "last_updated": "2025-11-25", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "writer.palmyra-x5-v1:0", + "name": "Palmyra X5", + "display_name": "Palmyra X5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1040000, + "output": 8192 }, - "temperature": false, + "temperature": 
true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-04-28", + "last_updated": "2025-04-28", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.6, + "output": 6 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "us.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (US)", + "display_name": "Claude Sonnet 4.6 (US)", "modalities": { "input": [ "text", @@ -132886,10 +136949,10 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -132899,59 +136962,52 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 2.5, + "input": 3, "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (AU)", + "display_name": "Claude Haiku 4.5 (AU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -132959,163 +137015,139 @@ }, "limit": { "context": 200000, - "output": 100000 + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "meta.llama3-3-70b-instruct-v1:0", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "zai.glm-5", + "name": 
"GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 202752, + "output": 101376 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "us.anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8 (US)", + "display_name": "Claude Opus 4.8 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, @@ -133129,164 +137161,106 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be 
treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "global.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (Global)", + "display_name": "Claude Opus 4.7 (Global)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", - "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "us.anthropic.claude-fable-5", + "name": "Claude Fable 5 (US)", + "display_name": "Claude Fable 5 (US)", "modalities": { "input": [ "text", @@ -133297,65 +137271,71 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { 
"reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "openai/gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "amazon.nova-lite-v1:0", + "name": "Nova Lite", + "display_name": "Nova Lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 300000, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -133364,33 +137344,35 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-10", + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 5, - "output": 15 + "input": 0.06, + "output": 0.24, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", 
- "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (US)", + "display_name": "Claude Haiku 4.5 (US)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133400,44 +137382,44 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "openai/gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "mistral.voxtral-mini-3b-2507", + "name": "Voxtral Mini 3B 2507", + "display_name": "Voxtral Mini 3B 2507", "modalities": { "input": [ - "text", - "image" + "audio", + "text" ], "output": [ "text" @@ -133445,45 +137427,40 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.04, + "output": 0.04 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "moonshot.kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262143, + "output": 16000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -133492,67 +137469,55 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": 
true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.6, + "output": 2.5 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "meta.llama3-1-70b-instruct-v1:0", + "name": "Llama 3.1 70B Instruct", + "display_name": "Llama 3.1 70B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.72, + "output": 0.72 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "us.deepseek.r1-v1:0", + "name": "DeepSeek-R1 (US)", + "display_name": "DeepSeek-R1 (US)", "modalities": { "input": [ "text" @@ -133562,8 +137527,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -133571,126 +137536,156 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - 
"last_updated": "2026-03-18", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "global.anthropic.claude-sonnet-4-6", + "name": "Claude Sonnet 4.6 (Global)", + "display_name": "Claude Sonnet 4.6 (Global)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.3, - "output": 1.2 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "moonshotai.kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 262143, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -133700,110 +137695,118 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "au.anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8 (AU)", + "display_name": "Claude Opus 4.8 (AU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + 
"interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "nvidia.nemotron-nano-12b-v2", + "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.2, + "output": 0.6 }, "type": "chat" - } - ] - }, - "stepfun": { - "id": "stepfun", - "name": "StepFun", - "display_name": "StepFun", - "api": "https://api.stepfun.com/v1", - "doc": 
"https://platform.stepfun.com/docs/zh/overview/concept", - "models": [ + }, { - "id": "step-2-16k", - "name": "Step 2 (16K)", - "display_name": "Step 2 (16K)", + "id": "zai.glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ "text" @@ -133813,8 +137816,8 @@ ] }, "limit": { - "context": 16384, - "output": 8192 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -133823,55 +137826,53 @@ "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 5.21, - "output": 16.44, - "cache_read": 1.04 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "step-1-32k", - "name": "Step 1 (32K)", - "display_name": "Step 1 (32K)", + "id": "meta.llama4-scout-17b-instruct-v1:0", + "name": "Llama 4 Scout 17B Instruct", + "display_name": "Llama 4 Scout 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 3500000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2025-01-01", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 2.05, - "output": 9.59, - "cache_read": 0.41 + "input": 0.17, + "output": 0.66 }, "type": "chat" }, { - "id": "step-3.5-flash", - "name": "Step 3.5 Flash", - "display_name": "Step 3.5 Flash", + "id": "qwen.qwen3-235b-a22b-2507-v1:0", + "name": "Qwen3 235B A22B 2507", + "display_name": "Qwen3 235B A22B 2507", "modalities": { 
"input": [ "text" @@ -133881,134 +137882,186 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 0.096, - "output": 0.288, - "cache_read": 0.019 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "step-3.5-flash-2603", - "name": "Step 3.5 Flash 2603", - "display_name": "Step 3.5 Flash 2603", + "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", + "name": "Claude Haiku 4.5 (EU)", + "display_name": "Claude Haiku 4.5 (EU)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" - } - ] - }, - "anyapi": { - "id": "anyapi", - "name": "AnyAPI", - "display_name": "AnyAPI", - "api": "https://api.anyapi.ai/v1", - "doc": "https://docs.anyapi.ai", - "models": [ + }, { - "id": "mistralai/mistral-large-2512", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "openai.gpt-oss-20b-1:0", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.07, + "output": 0.3 }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2025-12-02", "type": "chat" }, { - "id": "mistralai/devstral-2512", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "jp.anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8 (JP)", + "display_name": "Claude Opus 4.8 (JP)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + 
"low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", + "id": "anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -134016,36 +138069,56 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from 
thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2026-02-28", + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "deepseek/deepseek-chat", - "name": "DeepSeek Chat", - "display_name": "DeepSeek Chat", + "id": "qwen.qwen3-coder-30b-a3b-v1:0", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -134055,25 +138128,29 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-12-01", - "last_updated": "2026-02-28", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "qwen.qwen3-next-80b-a3b", + "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", "modalities": { "input": [ "text" @@ -134083,77 +138160,64 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", 
- "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-09-18", + "last_updated": "2025-11-25", + "cost": { + "input": 0.14, + "output": 1.4 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "openai.gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-06-01", + "cost": { + "input": 5.5, + "output": 33, + "cache_read": 0.55 }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "au.anthropic.claude-sonnet-4-6", + "name": "AU Anthropic Claude Sonnet 4.6", + "display_name": "AU Anthropic Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -134166,7 +138230,7 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -134204,15 +138268,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", + "knowledge": "2025-08", "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "last_updated": "2026-02-17", + "cost": { + "input": 3.3, + "output": 16.5, + "cache_read": 0.33, + "cache_write": 4.125 + }, 
"type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (US)", + "display_name": "Claude Opus 4.5 (US)", "modalities": { "input": [ "text", @@ -134237,11 +138307,17 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -134249,74 +138325,60 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "minimax.minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 196608, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.3, + "output": 1.2 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "eu.anthropic.claude-opus-4-8", + "name": "Claude Opus 4.8 (EU)", + "display_name": "Claude Opus 4.8 (EU)", "modalities": { "input": [ "text", @@ -134331,7 +138393,7 @@ "context": 1000000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -134341,41 +138403,44 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, + "mode": "effort", "effort": "high", "effort_options": [ "low", "medium", "high", + "xhigh", "max" ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" ], "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", + "cost": { + "input": 5.5, + "output": 27.5, + "cache_read": 0.55, + "cache_write": 6.875 + }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "eu.anthropic.claude-opus-4-7", + "name": "Claude Opus 4.7 (EU)", + "display_name": "Claude Opus 4.7 (EU)", "modalities": { "input": [ "text", @@ -134427,12 +138492,50 @@ "knowledge": "2026-01-31", "release_date": "2026-04-16", "last_updated": "2026-04-16", + "cost": { + "input": 5.5, + "output": 27.5, + "cache_read": 0.55, + "cache_write": 6.875 + }, "type": "chat" }, { - "id": "xai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": "meta.llama3-1-8b-instruct-v1:0", + "name": "Llama 3.1 8B Instruct", + "display_name": "Llama 3.1 8B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.22, + "output": 0.22 + }, + "type": "chat" + }, + { + "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", + "name": "Claude Opus 4.1 (US)", + "display_name": "Claude Opus 4.1 (US)", "modalities": { "input": [ "text", @@ -134444,62 +138547,91 @@ ] }, "limit": { - "context": 1000000, - "output": 30000 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, 
+ "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 + }, "type": "chat" }, { - "id": "cohere/command-r-plus-08-2024", - "name": "Command R+", - "display_name": "Command R+", + "id": "meta.llama4-maverick-17b-instruct-v1:0", + "name": "Llama 4 Maverick 17B Instruct", + "display_name": "Llama 4 Maverick 17B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4000 + "context": 1000000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2024-06-01", - "release_date": "2024-08-30", - "last_updated": "2024-08-30", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", + "cost": { + "input": 0.24, + "output": 0.97 + }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (Global)", + "display_name": "Claude Opus 4.5 (Global)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -134507,112 +138639,126 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 64000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + 
"supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "nvidia.nemotron-super-3-120b", + "name": "NVIDIA Nemotron 3 Super 120B A12B", + "display_name": "NVIDIA Nemotron 3 Super 120B A12B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-11", + "last_updated": "2026-03-11", + "cost": { + "input": 0.15, + "output": 0.65 + }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": 
"nvidia.nemotron-nano-3-30b", + "name": "NVIDIA Nemotron Nano 3 30B", + "display_name": "NVIDIA Nemotron Nano 3 30B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.06, + "output": 0.24 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", + "name": "Claude Opus 4.5 (EU)", + "display_name": "Claude Opus 4.5 (EU)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -134620,51 +138766,63 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", + "default_enabled": false, + "mode": "mixed", "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, "summaries": true, 
"visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "global.anthropic.claude-opus-4-6-v1", + "name": "Claude Opus 4.6 (Global)", + "display_name": "Claude Opus 4.6 (Global)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -134672,8 +138830,8 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -134685,38 +138843,51 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", + "cost": { + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 + }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", + "name": "Claude Sonnet 4.5 (US)", + "display_name": "Claude Sonnet 4.5 (US)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -134724,147 +138895,118 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "budget", "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, + "min": 1024, "unit": "tokens" }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 + }, "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "google.gemma-3-12b-it", + "name": "Google Gemma 3 12B", + "display_name": "Google Gemma 3 12B", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-12", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.049999999999999996, + "output": 0.09999999999999999 + }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "minimax.minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, 
"default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.3, + "output": 1.2 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "eu.anthropic.claude-fable-5", + "name": "Claude Fable 5 (EU)", + "display_name": "Claude Fable 5 (EU)", "modalities": { "input": [ "text", @@ -134875,284 +139017,239 @@ ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", + "cost": { + "input": 11, + "output": 55, + "cache_read": 1.1, + "cache_write": 13.75 + }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "deepseek.v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 163840, + "output": 81920 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", + "cost": { + "input": 0.62, + "output": 1.85 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "mistral.ministral-3-14b-instruct", + "name": "Ministral 14B 3.0", + "display_name": "Ministral 14B 3.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - 
"effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" - }, + } + ] + }, + "togetherai": { + "id": "togetherai", + "name": "Together AI", + "display_name": "Together AI", + "doc": "https://docs.together.ai/docs/serverless-models", + "models": [ { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "LiquidAI/LFM2-24B-A2B", + "name": "LFM2-24B-A2B", + "display_name": "LFM2-24B-A2B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, + "context": 32768, "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-25", + "last_updated": "2026-02-25", + "cost": { + "input": 0.03, + "output": 0.12 + }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "meta-llama/Meta-Llama-3-8B-Instruct-Lite", + "name": "Meta Llama 3 8B Instruct Lite", + "display_name": "Meta Llama 3 8B Instruct Lite", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "release_date": "2024-04-18", + "last_updated": "2024-04-18", + "cost": { + "input": 0.14, + "output": 0.14 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "meta-llama/Llama-3.3-70B-Instruct-Turbo", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.88, + "output": 0.88 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" 
] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 131000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -135160,29 +139257,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 1.2, + "output": 4.5, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", @@ -135193,86 +139286,75 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", + 
"cost": { + "input": 0.5, + "output": 2.8 + }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "google/gemma-4-31B-it", + "name": "Gemma 4 31B Instruct", + "display_name": "Gemma 4 31B Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", + "cost": { + "input": 0.39, + "output": 0.97 + }, "type": "chat" - } - ] - }, - "vultr": { - "id": "vultr", - "name": "Vultr", - "display_name": "Vultr", - "api": "https://api.vultrinference.com/v1", - "doc": "https://api.vultrinference.com/", - "models": [ + }, { - "id": "MiniMaxAI/MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "google/gemma-3n-E4B-it", + "name": "Gemma 3N E4B Instruct", + "display_name": "Gemma 3N E4B Instruct", "modalities": { "input": [ "text" @@ -135282,40 +139364,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.06, + 
"output": 0.12 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "Qwen/Qwen3.7-Max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -135325,40 +139395,33 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 500000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.85, - "output": 3.1 + "input": 2.5, + "output": 7.5 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "Qwen/Qwen3.6-Plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text" @@ -135368,8 +139431,8 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1000000, + "output": 500000 }, "temperature": true, "tool_call": true, @@ -135388,24 +139451,24 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "nvidia/Nemotron-Cascade-2-30B-A3B", - "name": "NVIDIA Nemotron Cascade 2", - "display_name": "NVIDIA Nemotron Cascade 2", + "id": "Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "text" + "text", + "image" 
], "output": [ "text" @@ -135413,7 +139476,7 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 130000 }, "temperature": true, "tool_call": true, @@ -135421,21 +139484,31 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16", - "name": "NVIDIA Nemotron 3 Nano Omni", - "display_name": "NVIDIA Nemotron 3 Nano Omni", + "id": "Qwen/Qwen3-Coder-Next-FP8", + "name": "Qwen3 Coder Next FP8", + "display_name": "Qwen3 Coder Next FP8", "modalities": { "input": [ "text" @@ -135446,29 +139519,28 @@ }, "limit": { "context": 262144, - "output": 131072 + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-28", - "last_updated": "2026-04-28", + "knowledge": "2026-02-03", + "release_date": "2026-02-03", + "last_updated": "2026-02-03", "cost": { - "input": 0.13, - "output": 0.38 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "nvidia/DeepSeek-V3.2-NVFP4", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "name": "Qwen3 Coder 480B A35B Instruct", + "display_name": "Qwen3 Coder 480B A35B Instruct", "modalities": { "input": [ "text" @@ -135478,30 +139550,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.55, - "output": 1.65 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/Llama-3.1-Nemotron-Safety-Guard-8B-v3", - "name": "Llama 3.1 Nemotron Safety Guard", - "display_name": "Llama 3.1 Nemotron Safety Guard", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-tput", + "name": "Qwen3 235B A22B Instruct 2507 FP8", + "display_name": "Qwen3 235B A22B Instruct 2507 FP8", "modalities": { "input": [ "text" @@ -135511,38 +139582,29 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "knowledge": "2025-07", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.2, + "output": 0.6 }, "type": "chat" - } - ] - }, - "zai-coding-plan": { - "id": "zai-coding-plan", - "name": "Z.AI Coding Plan", - "display_name": "Z.AI Coding Plan", - "api": "https://api.z.ai/api/coding/paas/v4", - "doc": "https://docs.z.ai/devpack/overview", - "models": [ + }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "Qwen/Qwen2.5-7B-Instruct-Turbo", + "name": "Qwen 2.5 7B Instruct Turbo", + "display_name": "Qwen 2.5 7B Instruct Turbo", "modalities": { "input": [ "text" @@ -135552,57 +139614,40 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2024-09-19", + "last_updated": "2024-09-19", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "Qwen/Qwen3.5-9B", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -135622,21 +139667,19 @@ } }, "attachment": true, - "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "open_weights": true, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.17, + "output": 0.25 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -135646,7 +139689,7 @@ ] }, "limit": { - "context": 200000, + "context": 131072, "output": 131072 }, "temperature": true, @@ -135657,31 +139700,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": true, + 
"knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -135692,7 +139728,7 @@ }, "limit": { "context": 131072, - "output": 98304 + "output": 131072 }, "temperature": true, "tool_call": true, @@ -135700,23 +139736,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "pearl-ai/gemma-4-31b-it", + "name": "Pearl AI Gemma 4 31B Instruct", + "display_name": "Pearl AI Gemma 4 31B Instruct", "modalities": { "input": [ "text" @@ -135726,108 +139764,62 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 32000, + "output": 32000 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.28, + "output": 0.86 }, "type": "chat" - } 
- ] - }, - "amazon-bedrock": { - "id": "amazon-bedrock", - "name": "Amazon Bedrock", - "display_name": "Amazon Bedrock", - "doc": "https://docs.aws.amazon.com/bedrock/latest/userguide/models-supported.html", - "models": [ + }, { - "id": "eu.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (EU)", - "display_name": "Claude Haiku 4.5 (EU)", + "id": "nvidia/nemotron-3-ultra-550b-a55b", + "name": "Nemotron 3 Ultra 550B A55B", + "display_name": "Nemotron 3 Ultra 550B A55B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "limit": { + "context": 512300, + "output": 512300 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-06-04", + "last_updated": "2026-06-04", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.6, + "output": 3.6, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-30b-a3b-v1:0", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "deepcogito/cogito-v2-1-671b", + "name": "Cogito v2.1 671B", + "display_name": "Cogito v2.1 671B", "modalities": { "input": [ "text" @@ -135837,91 +139829,72 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "jp.anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8 (JP)", - "display_name": "Claude Opus 4.8 (JP)", + "id": "zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - 
"default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1, + "output": 3.2 }, "type": "chat" }, { - "id": "openai.gpt-oss-120b-1:0", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "zai-org/GLM-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ "text" @@ -135931,8 +139904,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -135940,20 +139913,26 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-11", + "release_date": "2026-04-07", + "last_updated": "2026-04-07", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.4, + "output": 4.4 }, "type": "chat" }, { - "id": "mistral.ministral-3-8b-instruct", - "name": "Ministral 3 8B", - "display_name": "Ministral 3 8B", + "id": "deepseek-ai/DeepSeek-R1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", 
"modalities": { "input": [ "text" @@ -135963,121 +139942,118 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163839, + "output": 163839 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-03-24", "cost": { - "input": 0.15, - "output": 0.15 + "input": 3, + "output": 7 }, "type": "chat" }, { - "id": "amazon.nova-pro-v1:0", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "deepseek-ai/DeepSeek-V3-1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "attachment": false, + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 0.6, + "output": 1.7 }, "type": "chat" }, { - "id": "au.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (AU)", - "display_name": "Claude Haiku 4.5 (AU)", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], 
"output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 512000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 1.74, + "output": 3.48, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "nvidia.nemotron-super-3-120b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "deepseek-ai/DeepSeek-V3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -136087,7 +140063,39 @@ ] }, "limit": { - "context": 262144, + "context": 131072, + "output": 131072 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-12-26", + "last_updated": "2025-05-29", + "cost": { + "input": 1.25, + "output": 1.25 + }, + "type": "chat" + }, + { + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, 
"output": 131072 }, "temperature": true, @@ -136096,84 +140104,70 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.15, - "output": 0.65 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (Global)", - "display_name": "Claude Opus 4.5 (Global)", + "id": "MiniMaxAI/MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "deepseek.v3-v1:0", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "essentialai/Rnj-1-Instruct", + "name": "Rnj-1 Instruct", + "display_name": "Rnj-1 Instruct", "modalities": { "input": [ "text" @@ -136183,30 +140177,38 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "knowledge": "2024-10", + "release_date": "2025-12-05", + "last_updated": "2025-12-05", "cost": { - "input": 0.58, - "output": 1.68 + "input": 0.15, + "output": 0.15 }, "type": "chat" - }, + } + ] + }, + "frogbot": { + "id": "frogbot", + "name": "FrogBot", + "display_name": "FrogBot", + "api": "https://app.frogbot.ai/api/v1", + "doc": "https://docs.frogbot.ai", + "models": [ { - "id": "meta.llama3-1-70b-instruct-v1:0", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "minimax-m2-5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -136216,40 +140218,42 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 192000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": 
true, + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2025-01-15", + "last_updated": "2025-02-22", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "writer.palmyra-x5-v1:0", - "name": "Palmyra X5", - "display_name": "Palmyra X5", + "id": "kimi-k2-6", + "name": "Kimi-K2.6", + "display_name": "Kimi-K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1040000, - "output": 8192 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -136259,81 +140263,52 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.6, - "output": 6 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (Global)", - "display_name": "Claude Opus 4.7 (Global)", + "id": "zai-glm-5-1", + "name": "Z.AI GLM-5.1", + "display_name": "Z.AI GLM-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 198000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only 
Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-20", + "last_updated": "2025-02-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.4, + "output": 4.4, + "cache_read": 0.26 }, "type": "chat" }, { - "id": "qwen.qwen3-235b-a22b-2507-v1:0", - "name": "Qwen3 235B A22B 2507", - "display_name": "Qwen3 235B A22B 2507", + "id": "grok-code-fast-1", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", "modalities": { "input": [ "text" @@ -136343,33 +140318,42 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "open_weights": false, + "knowledge": "2023-10", + "release_date": "2025-08-28", + "last_updated": "2025-08-28", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.2, + "output": 1.5, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (EU)", - "display_name": "Claude Opus 4.7 (EU)", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", "image", + "audio", + "video", "pdf" ], "output": [ @@ -136377,164 +140361,190 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, 
"reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 5.5, - "output": 27.5, - "cache_read": 0.55, - "cache_write": 6.875 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "qwen.qwen3-vl-235b-a22b", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + 
"default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "knowledge": "2025-01", + "release_date": "2025-07-17", + "last_updated": "2025-07-17", "cost": { "input": 0.3, - "output": 1.5 + "output": 2.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-480b-a35b-v1:0", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "attachment": true, + "open_weights": false, + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.22, - "output": 1.8 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, { - "id": "mistral.devstral-2-123b", - "name": "Devstral 2 123B", - "display_name": "Devstral 2 123B", + "id": "qwen-3-6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": true, + "open_weights": false, + 
"release_date": "2026-04-02", + "last_updated": "2026-04-03", "cost": { - "input": 0.4, - "output": 2 + "input": 0.5, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "minimax.minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "grok-4-3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 98304 + "context": 1000000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -136542,20 +140552,22 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": true, + "open_weights": false, + "knowledge": "2024-11", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "openai.gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "deepseek-v4-pro", + "name": "DeepSeek v4 Pro", + "display_name": "DeepSeek v4 Pro", "modalities": { "input": [ "text" @@ -136566,28 +140578,40 @@ }, "limit": { "context": 128000, - "output": 16384 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2026-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.74, + "output": 3.48, + "cache_read": 0.14 }, "type": "chat" }, { - "id": 
"us.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (US)", - "display_name": "Claude Opus 4.7 (US)", + "id": "claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", @@ -136599,7 +140623,7 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, "temperature": false, @@ -136648,41 +140672,43 @@ "type": "chat" }, { - "id": "meta.llama3-1-8b-instruct-v1:0", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "grok-4-1-fast-non-reasoning", + "name": "Grok 4.1 Fast (Non-Reasoning)", + "display_name": "Grok 4.1 Fast (Non-Reasoning)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 2000000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "qwen.qwen3-next-80b-a3b", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "minimax-m2-7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -136692,139 +140718,100 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 192000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "knowledge": "2024-09", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": 
{ - "input": 0.14, - "output": 1.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (US)", - "display_name": "Claude Opus 4.6 (US)", + "id": "gpt-5-3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", "high", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" - }, - { - "id": "mistral.ministral-3-14b-instruct", - "name": "Ministral 14B 3.0", - "display_name": "Ministral 14B 3.0", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2026-01-31", + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gpt-5-4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -136834,52 +140821,51 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header 
for this model family." - ] + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "au.anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8 (AU)", - "display_name": "Claude Opus 4.8 (AU)", + "id": "gpt-5-4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -136893,87 +140879,95 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "high", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", - "xhigh", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "mistral.voxtral-mini-3b-2507", - "name": "Voxtral Mini 3B 2507", - "display_name": "Voxtral Mini 3B 2507", + "id": "kimi-k2.5", + "name": "Kimi-K2.5", + "display_name": "Kimi-K2.5", "modalities": { "input": [ - "audio", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.04, - "output": 0.04 + "input": 0.6, + "output": 3, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "moonshotai.kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262143, - "output": 16000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -136983,121 +140977,79 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", 
+ "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.6, - "output": 3 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "global.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (Global)", - "display_name": "Claude Opus 4.6 (Global)", + "id": "gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 272000, "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ "low", "medium", "high", - "max" + "xhigh" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", - "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 - }, - "type": "chat" - }, - { - "id": "mistral.ministral-3-3b-instruct", - "name": "Ministral 3 3B", - "display_name": "Ministral 3 3B", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1 (US)", - "display_name": "Claude Opus 4.1 (US)", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", @@ -137110,7 +141062,7 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -137141,21 +141093,21 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6 (EU)", - "display_name": "Claude Opus 4.6 (EU)", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", 
"modalities": { "input": [ "text", @@ -137167,7 +141119,7 @@ ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 128000 }, "temperature": true, @@ -137208,19 +141160,97 @@ "open_weights": false, "knowledge": "2025-05-31", "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "last_updated": "2026-02-05", "cost": { - "input": 5.5, - "output": 27.5, - "cache_read": 0.55, - "cache_write": 6.875 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "us.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (US)", - "display_name": "Claude Haiku 4.5 (US)", + "id": "gemini-3-1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", + "modalities": { + "input": [ + "text", + "image", + "video", + "audio", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01", + "release_date": "2026-02-18", + "last_updated": "2026-02-18", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "grok-4-1-fast-reasoning", + "name": "Grok 4.1 Fast (Reasoning)", + "display_name": "Grok 4.1 Fast (Reasoning)", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 2000000, + "output": 128000 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-11", + "release_date": "2025-11-25", + "last_updated": "2025-11-25", + "cost": { + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-6", + "name": 
"Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", @@ -137245,11 +141275,18 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -137257,32 +141294,34 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "global.anthropic.claude-haiku-4-5-20251001-v1:0", - "name": "Claude Haiku 4.5 (Global)", - "display_name": "Claude Haiku 4.5 (Global)", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", + "video", + "audio", "pdf" ], "output": [ @@ -137290,53 +141329,50 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - 
"budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.5, + "output": 3, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "moonshot.kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -137346,8 +141382,8 @@ ] }, "limit": { - "context": 262143, - "output": 16000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -137357,60 +141393,73 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "1970-01-01", + "last_updated": "1970-01-01", "cost": { - "input": 0.6, - "output": 2.5 + "input": 0.07, + "output": 0.2 }, "type": "chat" - }, + } + ] + }, + "nova": { + "id": "nova", + "name": "Nova", + "display_name": "Nova", + "api": "https://api.nova.amazon.com/v1", + "doc": "https://nova.amazon.com/dev/documentation", + "models": [ { - "id": "google.gemma-3-4b-it", - "name": "Gemma 3 4B IT", - "display_name": "Gemma 3 4B IT", + "id": 
"nova-2-pro-v1", + "name": "Nova 2 Pro", + "display_name": "Nova 2 Pro", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2025-12-03", + "last_updated": "2026-01-03", "cost": { - "input": 0.04, - "output": 0.08 + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" }, { - "id": "openai.gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "nova-2-lite-v1", + "name": "Nova 2 Lite", + "display_name": "Nova 2 Lite", "modalities": { "input": [ "text", "image", + "video", "pdf" ], "output": [ @@ -137418,10 +141467,10 @@ ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 1000000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -137429,20 +141478,28 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-06-01", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 5.5, - "output": 33, - "cache_read": 0.55 + "input": 0, + "output": 0, + "reasoning": 0 }, "type": "chat" - }, + } + ] + }, + "alibaba-token-plan": { + "id": "alibaba-token-plan", + "name": "Alibaba Token Plan", + "display_name": "Alibaba Token Plan", + "api": "https://token-plan.ap-southeast-1.maas.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/token-plan-overview", + "models": [ { - "id": "zai.glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": 
"DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -137452,8 +141509,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, @@ -137474,24 +141531,24 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (Global)", - "display_name": "Claude Sonnet 4.6 (Global)", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -137505,53 +141562,30 @@ "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-9b-v2", - "name": "NVIDIA Nemotron Nano 9B v2", - "display_name": "NVIDIA Nemotron Nano 9B v2", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -137561,129 +141595,84 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.06, - "output": 0.23 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (EU)", - "display_name": "Claude Sonnet 4.6 (EU)", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 202752, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - 
"effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", - "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33, - "cache_write": 4.125 - }, - "type": "chat" - }, - { - "id": "openai.gpt-oss-safeguard-20b", - "name": "GPT OSS Safeguard 20B", - "display_name": "GPT OSS Safeguard 20B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.07, - "output": 0.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (JP)", - "display_name": "Claude Sonnet 4.6 (JP)", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -137691,96 +141680,77 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - 
"unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "minimax.minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "wan2.7-image-pro", + "name": "Wan2.7 Image Pro", + "display_name": "Wan2.7 Image Pro", "modalities": { "input": [ "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 8192, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "global.anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8 (Global)", - "display_name": "Claude Opus 4.8 (Global)", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" 
@@ -137788,67 +141758,54 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "minimax.minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 204608, - "output": 128000 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -137856,52 +141813,65 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-10-27", - 
"last_updated": "2025-10-27", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "mistral.voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "qwen-image-2.0", + "name": "Qwen Image 2.0", + "display_name": "Qwen Image 2.0", "modalities": { "input": [ - "text", - "audio" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 32000, + "context": 8192, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "attachment": false, + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0.15, - "output": 0.35 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek.v3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -137911,8 +141881,8 @@ ] }, "limit": { - "context": 163840, - "output": 81920 + "context": 196608, + "output": 24576 }, "temperature": true, "tool_call": true, @@ -137920,273 +141890,231 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2024-07", - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.62, - "output": 1.85 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 
0 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8 (EU)", - "display_name": "Claude Opus 4.8 (EU)", + "id": "qwen-image-2.0-pro", + "name": "Qwen Image 2.0 Pro", + "display_name": "Qwen Image 2.0 Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0, + "output": 0 }, - "attachment": true, + "type": "imageGeneration" + }, + { + "id": "wan2.7-image", + "name": "Wan2.7 Image", + "display_name": "Wan2.7 Image", + "modalities": { + "input": [ + "text" + ], + "output": [ + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 5.5, - "output": 27.5, - "cache_read": 0.55, - "cache_write": 6.875 + "input": 0, + "output": 0 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + 
"default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "us.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (US)", - "display_name": "Claude Opus 4.5 (US)", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual 
thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-12-03", + "last_updated": "2025-12-05", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -138194,126 +142122,104 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "alibaba": { + "id": "alibaba", + "name": "alibaba", + "display_name": "alibaba", + "api": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1", + "doc": "https://www.alibabacloud.com/help/en/model-studio/models", + "models": [ { - "id": "us.anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8 (US)", - "display_name": "Claude Opus 4.8 (US)", + "id": "qwen3-omni-flash", + "name": "Qwen3-Omni Flash", + "display_name": "Qwen3-Omni Flash", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 65536, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.43, + "output": 1.66, + "input_audio": 3.81, + "output_audio": 15.11 }, "type": "chat" }, { - "id": "au.anthropic.claude-opus-4-6-v1", - "name": "AU Anthropic Claude Opus 4.6", - "display_name": "AU Anthropic Claude Opus 4.6", + "id": "qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -138321,129 +142227,131 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 16.5, - "output": 82.5, - "cache_read": 1.65, - "cache_write": 20.625 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (US)", - "display_name": "Claude Sonnet 4.5 (US)", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-09-11", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.4, + "output": 1.2, + "reasoning": 4 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-12b-v2", - "name": "NVIDIA Nemotron Nano 12B v2 VL BF16", - "display_name": "NVIDIA Nemotron Nano 12B v2 VL BF16", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3-Coder 30B-A3B Instruct", + "display_name": "Qwen3-Coder 30B-A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 65536 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", + "cost": { + "input": 0.45, + "output": 2.25 + }, + "type": "chat" + }, + { + "id": "qwen3-omni-flash-realtime", + "name": "Qwen3-Omni Flash Realtime", + "display_name": "Qwen3-Omni Flash Realtime", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 65536, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -138452,18 +142360,21 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-04", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.52, + "output": 1.99, + "input_audio": 4.57, + "output_audio": 18.13 }, "type": "chat" }, { - "id": 
"zai.glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen3-32b", + "name": "Qwen3 32B", + "display_name": "Qwen3 32B", "modalities": { "input": [ "text" @@ -138473,14 +142384,19 @@ ] }, "limit": { - "context": 202752, - "output": 101376 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -138495,114 +142411,126 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 1, - "output": 3.2 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct", - "display_name": "Llama 4 Maverick 17B Instruct", + "id": "qwen-omni-turbo-realtime", + "name": "Qwen-Omni Turbo Realtime", + "display_name": "Qwen-Omni Turbo Realtime", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.27, + "output": 1.07, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-1-20250805-v1:0", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "qwen-plus-character-ja", + "name": "Qwen Plus 
Character (Japanese)", + "display_name": "Qwen Plus Character (Japanese)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 8192, + "output": 512 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2024-04", + "release_date": "2024-01", + "last_updated": "2024-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.5, + "output": 1.4 }, "type": "chat" }, { - "id": "us.anthropic.claude-sonnet-4-6", - "name": "Claude Sonnet 4.6 (US)", - "display_name": "Claude Sonnet 4.6 (US)", + "id": "qwen3-next-80b-a3b-instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.5, + "output": 2 + }, + "type": "chat" + }, + { + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": 
"Qwen3.7 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -138610,91 +142538,100 @@ }, "limit": { "context": 1000000, - "output": 64000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-04", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "meta.llama3-3-70b-instruct-v1:0", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "qwen3.6-35b-a3b", + "name": "Qwen3.6 35B-A3B", + "display_name": "Qwen3.6 35B-A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + 
"context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.248, + "output": 1.485 }, "type": "chat" }, { - "id": "qwen.qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -138704,7 +142641,7 @@ ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 65536 }, "temperature": true, @@ -138713,96 +142650,85 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "open_weights": false, + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.22, - "output": 1.8 + "input": 2.5, + "output": 7.5, + "cache_read": 0.5, + "cache_write": 3.125 }, "type": "chat" }, { - "id": "eu.anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5 (EU)", - "display_name": "Claude Opus 4.5 (EU)", + "id": "qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.2, + "output": 6 }, "type": "chat" }, { - "id": "mistral.mistral-large-3-675b-instruct", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "qwen2-5-omni-7b", + "name": "Qwen2.5-Omni 7B", + "display_name": "Qwen2.5-Omni 7B", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 32768, + "output": 2048 }, "temperature": true, "tool_call": true, @@ -138811,18 +142737,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "knowledge": "2024-04", + "release_date": "2024-12", + "last_updated": "2024-12", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.1, + "output": 0.4, + "input_audio": 6.76 }, "type": "chat" }, { - "id": "writer.palmyra-x4-v1:0", - "name": "Palmyra X4", - "display_name": "Palmyra X4", + "id": "qwen3-8b", + "name": "Qwen3 8B", + "display_name": "Qwen3 8B", "modalities": { "input": [ "text" @@ -138832,40 +142760,57 @@ ] }, 
"limit": { - "context": 122880, + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 2.5, - "output": 10 + "input": 0.18, + "output": 0.7, + "reasoning": 2.1 }, "type": "chat" }, { - "id": "mistral.pixtral-large-2502-v1:0", - "name": "Pixtral Large (25.02)", - "display_name": "Pixtral Large (25.02)", + "id": "qwen2-5-14b-instruct", + "name": "Qwen2.5 14B Instruct", + "display_name": "Qwen2.5 14B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 131072, "output": 8192 }, "temperature": true, @@ -138874,19 +142819,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-04-08", - "last_updated": "2025-04-08", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 2, - "output": 6 + "input": 0.35, + "output": 1.4 }, "type": "chat" }, { - "id": "amazon.nova-micro-v1:0", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B Thinking", + "display_name": "Qwen3 Next 80B A3B Thinking", "modalities": { "input": [ "text" @@ -138896,35 +142842,85 @@ ] }, "limit": { - "context": 128000, + "context": 131072, + "output": 32768 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": true, + "default": 
true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-09", + "last_updated": "2025-09", + "cost": { + "input": 0.5, + "output": 6 + }, + "type": "chat" + }, + { + "id": "qvq-max", + "name": "QVQ Max", + "display_name": "QVQ Max", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "knowledge": "2024-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 1.2, + "output": 4.8 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-6-v1", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" @@ -138932,117 +142928,124 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": 
[ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2026-04-27", + "last_updated": "2026-04-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.1875, + "output": 1.125, + "cache_write": 0.234375 }, "type": "chat" }, { - "id": "eu.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (EU)", - "display_name": "Claude Sonnet 4.5 (EU)", + "id": "qwen2-5-vl-72b-instruct", + "name": "Qwen2.5-VL 72B Instruct", + "display_name": "Qwen2.5-VL 72B Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 2.8, + "output": 8.4 + }, + "type": "chat" + }, + { + "id": "qwen3-vl-plus", + "name": "Qwen3 VL Plus", + "display_name": "Qwen3 VL Plus", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 32768 + }, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ 
"thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-04", + "release_date": "2025-09-23", + "last_updated": "2025-09-23", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33, - "cache_write": 4.125 + "input": 0.2, + "output": 1.6, + "reasoning": 4.8 }, "type": "chat" }, { - "id": "google.gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "qwen-vl-ocr", + "name": "Qwen Vl Ocr", + "display_name": "Qwen Vl Ocr", "modalities": { "input": [ "text", @@ -139053,7 +143056,39 @@ ] }, "limit": { - "context": 131072, + "context": 34096, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-10-28", + "last_updated": "2025-04-13", + "cost": { + "input": 0.72, + "output": 0.72 + }, + "type": "chat" + }, + { + "id": "qwen-mt-turbo", + "name": "Qwen Mt Turbo", + "display_name": "Qwen Mt Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, "output": 8192 }, "temperature": true, @@ -139063,127 +143098,146 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 + "input": 0.16, + "output": 0.49 }, "type": "chat" }, { - "id": "mistral.magistral-small-2509", - "name": "Magistral Small 1.2", - "display_name": "Magistral 
Small 1.2", + "id": "qwen-mt-plus", + "name": "Qwen Mt Plus", + "display_name": "Qwen Mt Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 40000 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-01", + "last_updated": "2025-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 2.46, + "output": 7.37 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-5-20251101-v1:0", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": true, + "attachment": false, + "open_weights": false, + "knowledge": "2025-04", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0.4, + "output": 2.4, + "reasoning": 2.4 + }, + "type": "chat" + }, + { + "id": "qwen-omni-turbo", + "name": "Qwen-Omni Turbo", + "display_name": "Qwen-Omni Turbo", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ], + "output": [ + "text", + "audio" + ] + }, + "limit": { + "context": 32768, + "output": 2048 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-08-01", + "knowledge": "2024-04", + "release_date": "2025-01-19", + "last_updated": "2025-03-26", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.07, + "output": 0.27, + "input_audio": 4.44, + "output_audio": 8.89 }, "type": "chat" }, { - "id": "google.gemma-3-27b-it", - "name": "Google Gemma 3 27B Instruct", - "display_name": "Google Gemma 3 27B Instruct", + "id": "qwen2-5-72b-instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": "Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202752, + "context": 131072, "output": 8192 }, "temperature": true, @@ -139191,25 +143245,24 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-27", - "last_updated": "2025-07-27", + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.12, - "output": 0.2 + "input": 1.4, + "output": 5.6 }, "type": "chat" }, { - "id": "global.anthropic.claude-fable-5", - "name": "Claude Fable 5 (Global)", - "display_name": "Claude Fable 5 (Global)", + "id": "qwen-flash", + 
"name": "Qwen Flash", + "display_name": "Qwen Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -139217,57 +143270,51 @@ }, "limit": { "context": 1000000, - "output": 128000 + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "knowledge": "2024-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "eu.anthropic.claude-fable-5", - "name": "Claude Fable 5 (EU)", - "display_name": "Claude Fable 5 (EU)", + "id": "qwen3-vl-235b-a22b", + "name": "Qwen3-VL 235B-A22B", + "display_name": "Qwen3-VL 235B-A22B", "modalities": { "input": [ "text", @@ -139278,10 +143325,10 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -139290,46 +143337,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 11, - "output": 55, - "cache_read": 1.1, - "cache_write": 13.75 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "us.meta.llama4-maverick-17b-instruct-v1:0", - "name": "Llama 4 Maverick 17B Instruct (US)", - "display_name": "Llama 4 Maverick 17B Instruct (US)", + "id": "qwen3-vl-30b-a3b", + "name": "Qwen3-VL 30B-A3B", + "display_name": "Qwen3-VL 30B-A3B", "modalities": { "input": [ "text", @@ -139340,154 +143371,121 @@ ] }, "limit": { - "context": 1000000, - "output": 16384 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.24, - "output": 0.97 + "input": 0.2, + "output": 0.8, + "reasoning": 2.4 }, "type": "chat" }, { - "id": "amazon.nova-2-lite-v1:0", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "qwen-vl-max", + "name": "Qwen-VL Max", + "display_name": "Qwen-VL Max", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, 
"attachment": false, "open_weights": false, - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2024-04", + "release_date": "2024-04-08", + "last_updated": "2025-08-13", "cost": { - "input": 0.33, - "output": 2.75 + "input": 0.8, + "output": 3.2 }, "type": "chat" }, { - "id": "jp.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (JP)", - "display_name": "Claude Sonnet 4.5 (JP)", + "id": "qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 - }, - "type": "chat" - }, - { - "id": "us.meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct (US)", - "display_name": "Llama 4 Scout 17B Instruct (US)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 3500000, - "output": 16384 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "nvidia.nemotron-nano-3-30b", - "name": "NVIDIA Nemotron Nano 3 30B", - "display_name": "NVIDIA Nemotron Nano 3 30B", + "id": "qwen-max", + "name": "Qwen Max", + "display_name": "Qwen Max", "modalities": { "input": [ "text" @@ -139497,226 +143495,215 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { + "supported": false + }, + "search": { "supported": true, - "default": true + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-04-03", + "last_updated": "2025-01-25", "cost": { - "input": 0.06, - "output": 0.24 + "input": 1.6, + "output": 6.4 }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-6", - "name": "AU Anthropic Claude Sonnet 4.6", - "display_name": "AU Anthropic Claude Sonnet 4.6", + "id": "qwen3-235b-a22b", + 
"name": "Qwen3 235B A22B", + "display_name": "Qwen3 235B A22B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 3.3, - "output": 16.5, - "cache_read": 0.33, - "cache_write": 4.125 + "input": 0.7, + "output": 2.8, + "reasoning": 8.4 }, "type": "chat" }, { - "id": "openai.gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "qwen3-livetranslate-flash-realtime", + "name": "Qwen3-LiveTranslate Flash Realtime", + "display_name": "Qwen3-LiveTranslate Flash Realtime", "modalities": { "input": [ "text", "image", - "pdf" + "audio", + "video" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 272000, - "output": 128000 + "context": 53248, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-06-01", + "knowledge": "2024-04", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 2.75, - "output": 16.5, - "cache_read": 0.275 + "input": 10, + "output": 10, + "input_audio": 10, + "output_audio": 38 }, "type": "chat" }, { - "id": "jp.anthropic.claude-opus-4-7", - "name": "Claude Opus 4.7 (JP)", - "display_name": "Claude Opus 4.7 (JP)", + "id": "qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ "text", "image", - "pdf" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "meta.llama4-scout-17b-instruct-v1:0", - "name": "Llama 4 Scout 17B Instruct", - "display_name": "Llama 4 Scout 17B Instruct", + "id": "qwen3.5-35b-a3b", + "name": "Qwen3.5 35B-A3B", + "display_name": "Qwen3.5 35B-A3B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 3500000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.17, - "output": 
0.66 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "openai.gpt-oss-safeguard-120b", - "name": "GPT OSS Safeguard 120B", - "display_name": "GPT OSS Safeguard 120B", + "id": "qwen3-coder-480b-a35b-instruct", + "name": "Qwen3-Coder 480B-A35B Instruct", + "display_name": "Qwen3-Coder 480B-A35B Instruct", "modalities": { "input": [ "text" @@ -139726,8 +143713,8 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -139735,91 +143722,123 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-29", - "last_updated": "2025-10-29", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.15, - "output": 0.6 + "input": 1.5, + "output": 7.5 }, "type": "chat" }, { - "id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (Global)", - "display_name": "Claude Sonnet 4.5 (Global)", + "id": "qwq-plus", + "name": "QwQ Plus", + "display_name": "QwQ Plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2025-03-05", + "last_updated": "2025-03-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.8, + "output": 2.4 }, "type": "chat" }, { - "id": "us.anthropic.claude-fable-5", - "name": "Claude Fable 5 (US)", - "display_name": "Claude Fable 5 (US)", + "id": "qwen2-5-32b-instruct", + "name": "Qwen2.5 32B Instruct", + "display_name": "Qwen2.5 32B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", + "cost": { + "input": 0.7, + "output": 2.8 + }, + "type": "chat" + }, + { + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -139828,46 +143847,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude 
Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "zai.glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -139877,30 +143878,29 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "openai.gpt-oss-20b-1:0", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "qwen3-14b", + "name": "Qwen3 14B", + "display_name": "Qwen3 14B", "modalities": { "input": [ "text" @@ -139910,149 +143910,135 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.07, - "output": 0.3 + "input": 0.35, + "output": 1.4, + "reasoning": 4.2 }, "type": "chat" }, { - "id": "anthropic.claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "qwen3-asr-flash", + "name": "Qwen3-ASR Flash", + "display_name": "Qwen3-ASR Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 53248, + "output": 4096 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "knowledge": "2024-04", + "release_date": "2025-09-08", + "last_updated": "2025-09-08", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.035, + "output": 0.035 }, "type": "chat" }, { - "id": "au.anthropic.claude-sonnet-4-5-20250929-v1:0", - "name": "Claude Sonnet 4.5 (AU)", - "display_name": "Claude Sonnet 4.5 (AU)", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2024-04", + "release_date": "2024-11-01", + "last_updated": "2025-04-28", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.05, + "output": 0.2, + "reasoning": 0.5 }, "type": "chat" }, { - "id": "openai.gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "qwen2-5-7b-instruct", + "name": "Qwen2.5 7B Instruct", + "display_name": "Qwen2.5 7B Instruct", "modalities": { "input": [ "text" @@ -140062,62 +144048,62 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2024-04", + "release_date": "2024-09", + "last_updated": "2024-09", "cost": { - "input": 0.07, - "output": 0.3 + "input": 0.175, + "output": 0.7 }, "type": "chat" }, { - "id": "qwen.qwen3-32b-v1:0", - "name": "Qwen3 32B (dense)", - "display_name": "Qwen3 32B (dense)", + "id": "qwen2-5-vl-7b-instruct", + "name": "Qwen2.5-VL 7B Instruct", + "display_name": "Qwen2.5-VL 7B Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, "knowledge": "2024-04", - "release_date": "2025-09-18", - "last_updated": "2025-09-18", + "release_date": "2024-09", + 
"last_updated": "2024-09", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.35, + "output": 1.05 }, "type": "chat" }, { - "id": "deepseek.r1-v1:0", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -140127,8 +144113,8 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -140136,109 +144122,126 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "knowledge": "2025-04", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 1.35, - "output": 5.4 + "input": 1.3, + "output": 7.8, + "cache_read": 0.13, + "cache_write": 1.625 }, "type": "chat" }, { - "id": "amazon.nova-lite-v1:0", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B-A10B", + "display_name": "Qwen3.5 122B-A10B", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "open_weights": true, + 
"release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.4, + "output": 3.2 }, "type": "chat" }, { - "id": "us.deepseek.r1-v1:0", - "name": "DeepSeek-R1 (US)", - "display_name": "DeepSeek-R1 (US)", + "id": "qwen-vl-plus", + "name": "Qwen-VL Plus", + "display_name": "Qwen-VL Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2024-01-25", + "last_updated": "2025-08-15", "cost": { - "input": 1.35, - "output": 5.4 + "input": 0.21, + "output": 0.63 }, "type": "chat" - } - ] - }, - "synthetic": { - "id": "synthetic", - "name": "Synthetic", - "display_name": "Synthetic", - "api": "https://api.synthetic.new/openai/v1", - "doc": "https://synthetic.new/pricing", - "models": [ + }, { - "id": "hf:openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "qwen3.6-plus", + "name": "Qwen3.6 Plus", + "display_name": "Qwen3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -140248,23 +144251,50 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + 
"knowledge": "2025-04", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.2, + "cache_write": 2.5 + } }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama-3.1-70B-Instruct", - "display_name": "Llama-3.1-70B-Instruct", + "id": "qwen3-coder-plus-2025-09-23", + "name": "Qwen3 Coder Plus 2025 09 23", + "display_name": "Qwen3 Coder Plus 2025 09 23", "modalities": { "input": [ "text" @@ -140274,30 +144304,21 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.9, - "output": 0.9 - }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.1-405B-Instruct", - "name": "Llama-3.1-405B-Instruct", - "display_name": "Llama-3.1-405B-Instruct", + "id": "qwen3-coder-plus-2025-07-22", + "name": "Qwen3 Coder Plus 2025 07 22", + "display_name": "Qwen3 Coder Plus 2025 07 22", "modalities": { "input": [ "text" @@ -140307,63 +144328,46 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 3, - "output": 3 - }, "type": "chat" }, { - "id": 
"hf:meta-llama/Llama-3.1-8B-Instruct", - "name": "Llama-3.1-8B-Instruct", - "display_name": "Llama-3.1-8B-Instruct", + "id": "qwen-vl-ocr-latest", + "name": "Qwen Vl Ocr Latest", + "display_name": "Qwen Vl Ocr Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 34096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", - "cost": { - "input": 0.2, - "output": 0.2 - }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "qvq-max-2025-05-15", + "name": "Qvq Max 2025 05 15", + "display_name": "Qvq Max 2025 05 15", "modalities": { "input": [ "text", @@ -140374,29 +144378,27 @@ ] }, "limit": { - "context": 524000, - "output": 4096 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.22, - "output": 0.88 + "supported": true, + "default": false, + "budget": { + "default": 16384, + "min": 0, + "max": 16384 + } }, + "attachment": false, "type": "chat" }, { - "id": "hf:meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "qwen-long", + "name": "Qwen Long", + "display_name": "Qwen Long", "modalities": { "input": [ "text" @@ -140406,63 +144408,68 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1000000, + "output": 8192 }, "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.9, - "output": 0.9 - }, "type": "chat" }, { - "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama-4-Scout-17B-16E-Instruct", - "display_name": "Llama-4-Scout-17B-16E-Instruct", + "id": "qwen-turbo-latest", + "name": "Qwen Turbo Latest", + "display_name": "Qwen Turbo Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 328000, - "output": 4096 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", - "cost": { - "input": 0.15, - "output": 0.6 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen 3 Coder 480B", - "display_name": "Qwen 3 Coder 480B", + "id": "qwen-turbo-2024-09-19", + "name": "Qwen Turbo 2024 09 19", + "display_name": "Qwen Turbo 2024 09 19", "modalities": { "input": [ "text" @@ -140472,8 +144479,8 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -140481,20 +144488,12 @@ "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": 
"2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", - "cost": { - "input": 2, - "output": 2 - }, "type": "chat" }, { - "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "qwen-flash-2025-07-28", + "name": "Qwen Flash 2025 07 28", + "display_name": "Qwen Flash 2025 07 28", "modalities": { "input": [ "text" @@ -140504,14 +144503,19 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -140524,39 +144528,41 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", - "cost": { - "input": 0.65, - "output": 3 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "hf:Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-97B-A17B", - "display_name": "Qwen3.5-97B-A17B", + "id": "qwen-plus-latest", + "name": "Qwen Plus Latest", + "display_name": "Qwen Plus Latest", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -140569,53 +144575,19 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 - }, - "type": "chat" - }, - { - "id": 
"hf:Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen 3 235B Instruct", - "display_name": "Qwen 3 235B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-07-21", - "cost": { - "input": 0.2, - "output": 0.6 - }, "type": "chat" }, { - "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen2.5-Coder-32B-Instruct", + "id": "qwen-plus-2024-09-19", + "name": "Qwen Plus 2024 09 19", + "display_name": "Qwen Plus 2024 09 19", "modalities": { "input": [ "text" @@ -140625,29 +144597,21 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-11-11", - "last_updated": "2024-11-11", - "cost": { - "input": 0.8, - "output": 0.8 - }, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen-plus-2025-07-14", + "name": "Qwen Plus 2025 07 14", + "display_name": "Qwen Plus 2025 07 14", "modalities": { "input": [ "text" @@ -140657,14 +144621,19 @@ ] }, "limit": { - "context": 191488, - "output": 65536 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, "extra_capabilities": { "reasoning": { @@ -140677,21 +144646,19 @@ ] } }, - "attachment": false, - 
"open_weights": true, - "release_date": "2026-02-07", - "last_updated": "2026-02-07", - "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.6 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "qwen-plus-2025-09-11", + "name": "Qwen Plus 2025 09 11", + "display_name": "Qwen Plus 2025 09 11", "modalities": { "input": [ "text" @@ -140701,34 +144668,44 @@ ] }, "limit": { - "context": 196608, - "output": 131000 + "context": 1000000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", - "cost": { - "input": 0.55, - "output": 2.19 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "hf:MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "qwen-max-latest", + "name": "Qwen Max Latest", + "display_name": "Qwen Max Latest", "modalities": { "input": [ "text" @@ -140738,40 +144715,27 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" 
- ] - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", - "cost": { - "input": 0.55, - "output": 2.19 - }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "qwen-max-2024-09-19", + "name": "Qwen Max 2024 09 19", + "display_name": "Qwen Max 2024 09 19", "modalities": { "input": [ "text" @@ -140781,41 +144745,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", - "cost": { - "input": 0.55, - "output": 2.19 - }, "type": "chat" }, { - "id": "hf:zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "qwen-max-2024-04-28", + "name": "Qwen Max 2024 04 28", + "display_name": "Qwen Max 2024 04 28", "modalities": { "input": [ "text" @@ -140825,41 +144775,21 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": 
"2026-04-08", - "cost": { - "input": 1, - "output": 3, - "cache_read": 1 - }, "type": "chat" }, { - "id": "hf:zai-org/GLM-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "qwen-max-2024-04-03", + "name": "Qwen Max 2024 04 03", + "display_name": "Qwen Max 2024 04 03", "modalities": { "input": [ "text" @@ -140869,41 +144799,21 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 8000, + "output": 2000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-12", - "cost": { - "input": 1, - "output": 3, - "cache_read": 1 - }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.7-Flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "qwen-max-2025-01-25", + "name": "Qwen Max 2025 01 25", + "display_name": "Qwen Max 2025 01 25", "modalities": { "input": [ "text" @@ -140913,41 +144823,27 @@ ] }, "limit": { - "context": 196608, - "output": 65536 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-18", - "last_updated": "2026-01-18", - "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.06 - }, "type": "chat" }, { - "id": "hf:zai-org/GLM-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + 
"id": "qwen3-max-2025-09-23", + "name": "Qwen3 Max 20250923", + "display_name": "Qwen3 Max 20250923", "modalities": { "input": [ "text" @@ -140957,35 +144853,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.55, - "output": 2.19 - }, "type": "chat" }, { - "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "qwen3-max-preview", + "name": "Qwen3 Max Preview", + "display_name": "Qwen3 Max Preview", "modalities": { "input": [ "text" @@ -141001,8 +144889,7 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -141015,40 +144902,41 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-04", - "release_date": "2026-03-11", - "last_updated": "2026-04-03", - "cost": { - "input": 0.3, - "output": 1, - "cache_read": 0.3 + "search": { + "supported": true, + "default": false, + "forced_search": false, + "search_strategy": "turbo" }, + "attachment": false, "type": "chat" }, { - "id": "hf:nvidia/Kimi-K2.5-NVFP4", - "name": "Kimi K2.5 (NVFP4)", - "display_name": "Kimi K2.5 (NVFP4)", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 
131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -141062,20 +144950,12 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0.55, - "output": 2.19 - }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen3-235b-a22b-instruct-2507", + "name": "Qwen3 235B A22B Instruct 2507", + "display_name": "Qwen3 235B A22B Instruct 2507", "modalities": { "input": [ "text" @@ -141085,29 +144965,21 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 0.56, - "output": 1.68 - }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -141117,29 +144989,21 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-25", - "cost": { - "input": 1.2, - "output": 1.2 - }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": 
"DeepSeek V3.2", + "id": "qwen3-30b-a3b-thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -141149,36 +145013,38 @@ ] }, "limit": { - "context": 162816, - "output": 8000 + "context": 131072, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", - "cost": { - "input": 0.27, - "output": 0.4, - "cache_read": 0.27, - "cache_write": 0 - }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -141188,14 +145054,19 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -141209,20 +145080,12 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", - "cost": { - "input": 0.55, - "output": 2.19 - }, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 (0324)", - "display_name": "DeepSeek V3 (0324)", + "id": "qwen3-4b", + "name": "Qwen3 4B", + "display_name": "Qwen3 4B", "modalities": { "input": [ "text" @@ -141232,28 +145095,38 @@ ] }, "limit": { - 
"context": 128000, - "output": 128000 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true, + "budget": { + "default": 38912, + "min": 0, + "max": 38912 + } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", - "cost": { - "input": 1.2, - "output": 1.2 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-V3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "qwen3-1.7b", + "name": "Qwen3 1.7B", + "display_name": "Qwen3 1.7B", "modalities": { "input": [ "text" @@ -141263,30 +145136,38 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", - "cost": { - "input": 1.25, - "output": 1.25 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, + "attachment": false, "type": "chat" }, { - "id": "hf:deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 (0528)", - "display_name": "DeepSeek R1 (0528)", + "id": "qwen3-0.6b", + "name": "Qwen3 0.6B", + "display_name": "Qwen3 0.6B", "modalities": { "input": [ "text" @@ -141296,14 +145177,19 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - 
"default": true + "default": true, + "budget": { + "default": 30720, + "min": 0, + "max": 30720 + } }, "extra_capabilities": { "reasoning": { @@ -141317,19 +145203,12 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-08-01", - "cost": { - "input": 3, - "output": 8 - }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "qwen3-vl-plus-2025-09-23", + "name": "Qwen3 VL Plus 2025 09 23", + "display_name": "Qwen3 VL Plus 2025 09 23", "modalities": { "input": [ "text", @@ -141341,13 +145220,18 @@ }, "limit": { "context": 262144, - "output": 65536 + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false, + "budget": { + "default": 81920, + "min": 0, + "max": 81920 + } }, "extra_capabilities": { "reasoning": { @@ -141360,22 +145244,13 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", - "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.95 - }, + "attachment": false, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Instruct-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "qwq-plus-latest", + "name": "QwQ Plus Latest", + "display_name": "QwQ Plus Latest", "modalities": { "input": [ "text" @@ -141385,138 +145260,180 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { + "supported": true, + "default": true, + "budget": { + "default": 32768, + "min": 0, + "max": 32768 + } + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "search": { "supported": false }, 
"attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", - "cost": { - "input": 1.2, - "output": 1.2 - }, "type": "chat" - }, + } + ] + }, + "databricks": { + "id": "databricks", + "name": "Databricks", + "display_name": "Databricks", + "api": "https://${DATABRICKS_HOST}/ai-gateway/mlflow/v1", + "doc": "https://docs.databricks.com/aws/en/machine-learning/foundation-models/", + "models": [ { - "id": "hf:moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "databricks-claude-opus-4-7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.55, - "output": 2.19 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "hf:moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "databricks-gpt-5-4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.55, - "output": 2.19 - }, - "type": "chat" - } - ] - }, - "cloudferro-sherlock": { - "id": "cloudferro-sherlock", - "name": "CloudFerro Sherlock", - "display_name": "CloudFerro Sherlock", - "api": "https://api-sherlock.cloudferro.com/openai/v1/", - "doc": "https://docs.sherlock.cloudferro.com/", - "models": [ + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } + }, + "type": 
"chat" + }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "databricks-gemini-3-flash", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 196000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -141524,286 +145441,344 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "databricks-claude-opus-4-5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 70000, - "output": 70000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10-09", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 2.92, - "output": 2.92 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v2.6-Instruct", - "name": "Bielik 11B v2.6 Instruct", - "display_name": "Bielik 11B v2.6 Instruct", + "id": "databricks-gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.67, - "output": 0.67 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "speakleash/Bielik-11B-v3.0-Instruct", - "name": "Bielik 11B v3.0 Instruct", - "display_name": "Bielik 11B v3.0 Instruct", + "id": "databricks-gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.67, - "output": 0.67 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT OSS 120B", - "display_name": "OpenAI GPT OSS 120B", + "id": "databricks-gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 2.92, - "output": 2.92 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" - } - ] - }, - "helicone": { - "id": "helicone", - "name": "Helicone", - "display_name": "Helicone", - "api": "https://ai-gateway.helicone.ai/v1", - "doc": "https://helicone.ai/models", - "models": [ + }, { - "id": "chatgpt-4o-latest", - "name": "OpenAI ChatGPT-4o", - "display_name": "OpenAI ChatGPT-4o", + "id": "databricks-gemini-2-5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1048576, + "output": 
65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-14", - "last_updated": "2024-08-14", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 5, - "output": 20, - "cache_read": 2.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" }, { - "id": "mistral-large-2411", - "name": "Mistral-Large", - "display_name": "Mistral-Large", + "id": "databricks-gemini-3-1-pro", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-24", - "last_updated": "2024-07-24", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { "input": 2, - "output": 6 + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "OpenAI: GPT-5 Pro", - "display_name": "OpenAI: GPT-5 Pro", + "id": "databricks-gemini-2-5-flash", + "name": "Gemini 2.5 
Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 15, - "output": 120 + "input": 0.3, + "output": 2.5, + "cache_read": 0.03, + "input_audio": 1 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Anthropic: Claude Sonnet 4", - "display_name": "Anthropic: Claude Sonnet 4", + "id": "databricks-claude-sonnet-4", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -141840,145 +145815,181 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, - "cache_read": 0.30000000000000004, + "cache_read": 0.3, "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "OpenAI GPT-5 Mini", - "display_name": "OpenAI GPT-5 Mini", + "id": "databricks-claude-haiku-4-5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ "text", - "image" 
+ "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "databricks-gpt-5-4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - 
"attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "sonar", - "name": "Perplexity Sonar", - "display_name": "Perplexity Sonar", + "id": "databricks-claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 1000000, + "output": 128000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 1, - "output": 1 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gpt-4o", - "name": "OpenAI GPT-4o", - "display_name": "OpenAI GPT-4o", + "id": "databricks-gpt-5-1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ "text", @@ -141989,107 +146000,159 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "knowledge": "2024-09-30", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2.5, + "input": 1.25, "output": 10, - "cache_read": 1.25 + "cache_read": 0.125 }, "type": "chat" }, { - "id": "llama-4-maverick", - "name": "Meta Llama 4 Maverick 17B 128E", - "display_name": "Meta Llama 4 Maverick 17B 128E", + "id": "databricks-claude-sonnet-4-5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": 
true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.15, - "output": 0.6 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "OpenAI GPT-5 Chat Latest", - "display_name": "OpenAI GPT-5 Chat Latest", + "id": "databricks-claude-opus-4-1", + "name": "Claude Opus 4.1 (latest)", + "display_name": "Claude Opus 4.1 (latest)", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-09", - "release_date": "2024-09-30", - "last_updated": "2024-09-30", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "OpenAI: GPT-5 Codex", - "display_name": "OpenAI: GPT-5 Codex", + "id": "databricks-gpt-5-5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, @@ -142098,103 +146161,92 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "o3", - "name": "OpenAI o3", - "display_name": "OpenAI o3", + "id": "databricks-gemini-3-1-flash-lite", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", 
"modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1048576, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "Zai GLM-4.6", - "display_name": "Zai GLM-4.6", + "id": "databricks-gemini-3-pro", + "name": "Gemini 3 Pro Preview", + "display_name": "Gemini 3 Pro Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -142202,70 +146254,103 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "knowledge": "2025-01", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.44999999999999996, - "output": 1.5 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + 
"size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "databricks-claude-sonnet-4-6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40960 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2025-04-28", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.29, - "output": 0.59 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3 Coder 30B A3B Instruct", - "display_name": "Qwen3 Coder 30B A3B Instruct", + "id": "databricks-gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -142275,29 +146360,29 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-31", - "last_updated": "2025-07-31", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.09999999999999999, - "output": 0.3 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "databricks-gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -142307,72 +146392,64 @@ ] }, "limit": { - "context": 256000, - "output": 262144 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-06", - 
"last_updated": "2025-11-06", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.48, - "output": 2 + "input": 0.072, + "output": 0.28 }, "type": "chat" }, { - "id": "deepseek-tng-r1t2-chimera", - "name": "DeepSeek TNG R1T2 Chimera", - "display_name": "DeepSeek TNG R1T2 Chimera", + "id": "databricks-gpt-5-2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 130000, - "output": 163840 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-02", - "last_updated": "2025-07-02", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.3, - "output": 1.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Anthropic: Claude 4.5 Haiku (20251001)", - "display_name": "Anthropic: Claude 4.5 Haiku (20251001)", + "id": "databricks-gpt-5-4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -142383,213 +146460,246 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", + "cost": { + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 + }, + "type": "chat" + } + ] + }, + "crof": { + "id": "crof", + "name": "CrofAI", + "display_name": "CrofAI", + "api": "https://crof.ai/v1", + "doc": 
"https://crof.ai/docs", + "models": [ + { + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 0.12, + "output": 0.21, + "cache_read": 0.003 }, "type": "chat" }, { - "id": "claude-3.5-sonnet-v2", - "name": "Anthropic: Claude 3.5 Sonnet v2", - "display_name": "Anthropic: Claude 3.5 Sonnet v2", + "id": "minimax-m2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + 
"open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.11, + "output": 0.95, + "cache_read": 0.02, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 202752, + "output": 202752 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.3, - "output": 1.5 + "input": 0.25, + "output": 1.1, + "cache_read": 0.05, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5", - "name": "OpenAI GPT-5", - "display_name": "OpenAI GPT-5", + "id": "greg-1-super", + "name": "Greg 1 Super", + "display_name": "Greg 1 Super", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 229376, + "output": 229376 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - 
"effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 1, + "output": 5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "xAI Grok 4 Fast Non-Reasoning", - "display_name": "xAI Grok 4 Fast Non-Reasoning", + "id": "deepseek-v4-pro-lightning", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.8, + "output": 1.6, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "sonar-pro", - "name": "Perplexity Sonar Pro", - "display_name": "Perplexity Sonar Pro", + "id": "greg-rp", + "name": "Greg (Roleplay)", + "display_name": "Greg (Roleplay)", "modalities": { "input": [ "text" @@ -142599,8 +146709,8 @@ ] }, "limit": { - "context": 200000, - "output": 
4096 + "context": 229376, + "output": 229376 }, "temperature": true, "tool_call": false, @@ -142609,19 +146719,19 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -142632,30 +146742,30 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "greg-1", + "name": "Greg 1 Normal", + "display_name": "Greg 1 Normal", "modalities": { "input": [ "text" @@ -142665,48 +146775,42 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 229376, + "output": 229376 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + 
"release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 0.27, - "output": 0.41 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "o3-pro", - "name": "OpenAI o3 Pro", - "display_name": "OpenAI o3 Pro", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -142715,32 +146819,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 20, - "output": 80 + "input": 0.45, + "output": 2.15, + "cache_read": 0.08, + "cache_write": 0 }, "type": "chat" }, { - "id": "llama-3.1-8b-instant", - "name": "Meta Llama 3.1 8B Instant", - "display_name": "Meta Llama 3.1 8B Instant", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -142750,41 +146852,55 @@ ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] 
+ } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.049999999999999996, - "output": 0.08 + "input": 0.35, + "output": 0.8, + "cache_read": 0.003 }, "type": "chat" }, { - "id": "o4-mini", - "name": "OpenAI o4 Mini", - "display_name": "OpenAI o4 Mini", + "id": "kimi-k2.5-lightning", + "name": "Kimi K2.5 (Lightning)", + "display_name": "Kimi K2.5 (Lightning)", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 32768 }, "temperature": false, "tool_call": true, @@ -142795,44 +146911,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 1, + "output": 3, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "o3-mini", - "name": "OpenAI o3 Mini", - "display_name": "OpenAI o3 Mini", + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 262144 }, "temperature": false, "tool_call": true, @@ -142843,83 +146957,50 @@ "extra_capabilities": { "reasoning": { "supported": 
true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2023-10", - "release_date": "2023-10-01", - "last_updated": "2023-10-01", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.35, + "output": 1.7, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "sonar-reasoning", - "name": "Perplexity Sonar Reasoning", - "display_name": "Perplexity Sonar Reasoning", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 1, - "output": 5 - }, - "type": "chat" - }, - { - "id": "deepseek-reasoner", - "name": "DeepSeek Reasoner", - "display_name": "DeepSeek Reasoner", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 64000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": true - }, "extra_capabilities": { "reasoning": { "supported": true, @@ -142931,248 +147012,277 @@ ] } }, - "attachment": false, - "open_weights": false, + "attachment": true, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-04-21", + 
"last_updated": "2026-04-21", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 + "input": 0.5, + "output": 1.99, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "ernie-4.5-21b-a3b-thinking", - "name": "Baidu Ernie 4.5 21B A3B Thinking", - "display_name": "Baidu Ernie 4.5 21B A3B Thinking", + "id": "qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-03-16", - "last_updated": "2025-03-16", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.2, + "output": 1.5, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Anthropic: Claude 3.7 Sonnet", - "display_name": "Anthropic: Claude 3.7 Sonnet", + "id": "qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": 
"full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.04, + "output": 0.15, + "cache_read": 0.008 }, "type": "chat" }, { - "id": "mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "qwen3.5-397b-a17b", + "name": "Qwen3.5 397B-A17B", + "display_name": "Qwen3.5 397B-A17B", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 20, - "output": 40 + "input": 0.35, + "output": 1.75, + "cache_read": 0.07 }, "type": "chat" }, { - "id": "mistral-small", - "name": "Mistral Small 3.2", - "display_name": "Mistral Small 3.2", + "id": "glm-4.7-flash", + "name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 
16384 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "knowledge": "2025-04", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.075, - "output": 0.2 + "input": 0.04, + "output": 0.3, + "cache_read": 0.008, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "OpenAI GPT-5.1", - "display_name": "OpenAI GPT-5.1", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.4, + "output": 0.8, + "cache_read": 0.003, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": 
{ + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "OpenAI GPT-5 Nano", - "display_name": "OpenAI GPT-5 Nano", + "id": "glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 202752, + "output": 202752 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -143181,40 +147291,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.049999999999999996, - "output": 0.39999999999999997, - "cache_read": 0.005 + "input": 0.48, + "output": 1.9, + "cache_read": 0.1, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "OpenAI GPT-OSS 120b", - "display_name": "OpenAI GPT-OSS 120b", + "id": "deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text" @@ -143224,14 +147324,13 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -143240,19 +147339,19 @@ }, 
"attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.04, - "output": 0.16 + "input": 0.18, + "output": 0.35, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "grok-3", - "name": "xAI Grok 3", - "display_name": "xAI Grok 3", + "id": "greg-1-mini", + "name": "Greg 1 Mini", + "display_name": "Greg 1 Mini", "modalities": { "input": [ "text" @@ -143262,133 +147361,111 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 229376, + "output": 229376 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2026-01-27", + "last_updated": "2026-01-27", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.07, + "output": 0.15, + "cache_read": 0.01 }, "type": "chat" - }, + } + ] + }, + "fastrouter": { + "id": "fastrouter", + "name": "FastRouter", + "display_name": "FastRouter", + "api": "https://go.fastrouter.ai/api/v1", + "doc": "https://fastrouter.ai/models", + "models": [ { - "id": "gpt-4o-mini", - "name": "OpenAI GPT-4o-mini", - "display_name": "OpenAI GPT-4o-mini", + "id": "wanx/wan-v2-6", + "name": "Wan 2.6", + "display_name": "Wan 2.6", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", - "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 - }, + "attachment": true, + 
"open_weights": true, + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Anthropic: Claude Opus 4.1", - "display_name": "Anthropic: Claude Opus 4.1", + "id": "moonshotai/kimi-k2", + "name": "Kimi K2", + "display_name": "Kimi K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.55, + "output": 2.2 }, "type": "chat" }, { - "id": "grok-4-fast-reasoning", - "name": "xAI: Grok 4 Fast Reasoning", - "display_name": "xAI: Grok 4 Fast Reasoning", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -143401,160 +147478,174 @@ "supported": true } }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "attachment": true, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 0.75, + "output": 3.5 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "OpenAI: GPT-5.1 Codex Mini", - "display_name": "OpenAI: GPT-5.1 Codex Mini", + "id": "google/imagen-4.0-fast", + "name": "Imagen 4 Fast", + "display_name": "Imagen 4 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", "image" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 480, + "output": 8192 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - 
"effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", - "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.024999999999999998 - }, + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "xAI Grok 4.1 Fast Non-Reasoning", - "display_name": "xAI Grok 4.1 Fast Non-Reasoning", + "id": "google/gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 1.25, + "output": 10, + "cache_read": 0.31 }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Anthropic: Claude 3.5 Haiku", - "display_name": "Anthropic: Claude 3.5 Haiku", + "id": "google/gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + 
"display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.7999999999999999, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.3, + "output": 2.5, + "cache_read": 0.0375 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "OpenAI GPT-OSS 20b", - "display_name": "OpenAI GPT-OSS 20b", + "id": "google/gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -143564,56 +147655,66 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": 
"2024-06-01", - "last_updated": "2024-06-01", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 0.049999999999999996, - "output": 0.19999999999999998 + "input": 1.5, + "output": 9 }, "type": "chat" }, { - "id": "llama-prompt-guard-2-86m", - "name": "Meta Llama Prompt Guard 2 86M", - "display_name": "Meta Llama Prompt Guard 2 86M", + "id": "google/veo3.1-lite", + "name": "Veo 3.1 Lite", + "display_name": "Veo 3.1 Lite", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 512, - "output": 2 + "context": 400000, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", - "cost": { - "input": 0.01, - "output": 0.01 - }, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "type": "chat" }, { - "id": "llama-4-scout", - "name": "Meta Llama 4 Scout 17B 16E", - "display_name": "Meta Llama 4 Scout 17B 16E", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -143624,77 +147725,100 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.08, - "output": 0.3 + "input": 0.13, + "output": 0.38 }, "type": "chat" }, { - "id": "sonar-reasoning-pro", - "name": "Perplexity Sonar Reasoning Pro", - "display_name": 
"Perplexity Sonar Reasoning Pro", + "id": "google/veo3.1", + "name": "Veo 3.1", + "display_name": "Veo 3.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ + "video" + ] + }, + "limit": { + "context": 400000, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", + "type": "chat" + }, + { + "id": "google/imagen-4.0-ultra", + "name": "Imagen 4 Ultra", + "display_name": "Imagen 4 Ultra", + "modalities": { + "input": [ "text" + ], + "output": [ + "image" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 480, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", - "cost": { - "input": 2, - "output": 8 - }, - "type": "chat" + "release_date": "2025-05-20", + "last_updated": "2025-05-20", + "type": "imageGeneration" }, { - "id": "gemini-2.5-pro", - "name": "Google Gemini 2.5 Pro", - "display_name": "Google Gemini 2.5 Pro", + "id": "google/gemini-3-pro-image-preview", + "name": "Nano Banana Pro", + "display_name": "Nano Banana Pro", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 65536, + "output": 32768 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -143703,14 +147827,12 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, 
"visibility": "summary", "continuation": [ @@ -143718,37 +147840,38 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2025-01", + "release_date": "2025-11-20", + "last_updated": "2025-11-20", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.3125, - "cache_write": 1.25 + "input": 2, + "output": 12 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "google/gemini-3.1-flash-image-preview", + "name": "Nano Banana 2", + "display_name": "Nano Banana 2", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "text" + "text", + "image" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 65536, + "output": 65536 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -143758,313 +147881,269 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-02-26", + "last_updated": "2026-02-26", "cost": { - "input": 0.03, - "output": 0.13 + "input": 0.5, + "output": 3 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 41000, - "output": 41000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.08, - "output": 0.29 + "input": 2, + "output": 12 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "OpenAI GPT-4.1", - "display_name": "OpenAI GPT-4.1", + "id": "google/veo3.1-fast", + "name": "Veo 3.1 Fast", + "display_name": "Veo 3.1 Fast", "modalities": { "input": [ "text", "image" ], "output": [ - "text" + "video" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "type": "chat" }, { - "id": "llama-guard-4", - "name": "Meta Llama Guard 4 12B", - "display_name": "Meta Llama Guard 4 12B", + "id": "x-ai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 1024 + "context": 1000000, + "output": 30000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": 
{ + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.21, - "output": 0.21 + "input": 1.25, + "output": 2.5 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Anthropic: Claude Sonnet 4.5 (20250929)", - "display_name": "Anthropic: Claude Sonnet 4.5 (20250929)", + "id": "x-ai/grok-4", + "name": "Grok 4", + "display_name": "Grok 4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, + "context": 256000, "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-07", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { "input": 3, "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "cache_read": 0.75, + "cache_write": 15 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Anthropic: Claude Opus 4.1 (20250805)", - "display_name": "Anthropic: Claude Opus 4.1 (20250805)", + "id": "x-ai/grok-build-0.1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 256000, + "output": 256000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] + "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Google Gemini 2.5 Flash Lite", - "display_name": "Google Gemini 2.5 Flash Lite", + "id": "z-ai/glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998, - "cache_write": 0.09999999999999999 + "input": 1.05, + "output": 3.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Google Gemini 2.5 Flash", - "display_name": "Google Gemini 2.5 Flash", + "id": "z-ai/glm-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65535 + "context": 204800, + "output": 131072 }, 
"temperature": true, "tool_call": true, @@ -144075,40 +148154,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "cache_write": 0.3 + "input": 0.95, + "output": 3.15 }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Anthropic: Claude 4.5 Haiku", - "display_name": "Anthropic: Claude 4.5 Haiku", + "id": "openai/gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -144119,134 +148186,198 @@ ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-10", - "release_date": "2025-10-01", - "last_updated": "2025-10-01", + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.09999999999999999, - "cache_write": 1.25 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, 
{ - "id": "deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "openai/gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.21600000000000003 + "input": 0.2, + "output": 1.25 }, "type": "chat" }, { - "id": "gemma-3-12b-it", - "name": "Google Gemma 3 12B", - "display_name": "Google Gemma 3 12B", + "id": "openai/gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" 
+ ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.049999999999999996, - "output": 0.09999999999999999 + "input": 1.75, + "output": 14 }, "type": "chat" }, { - "id": "claude-4.5-opus", - "name": "Anthropic: Claude Opus 4.5", - "display_name": "Anthropic: Claude Opus 4.5", + "id": "openai/gpt-realtime-1.5", + "name": "GPT Realtime 1.5", + "display_name": "GPT Realtime 1.5", "modalities": { "input": [ "text", + "audio", "image" ], "output": [ - "text" + "text", + "audio" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 4, + "output": 16 }, "type": "chat" }, { - "id": "kimi-k2-0711", - "name": "Kimi K2 (07/11)", - "display_name": "Kimi K2 (07/11)", + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -144257,28 +148388,33 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": 
"2025-01-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.5700000000000001, - "output": 2.3 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Anthropic: Claude Sonnet 4.5", - "display_name": "Anthropic: Claude Sonnet 4.5", + "id": "openai/gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": "GPT-5.4 mini", "modalities": { "input": [ "text", @@ -144289,96 +148425,142 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.30000000000000004, - "cache_write": 3.75 + "input": 0.75, + "output": 4.5 }, "type": "chat" }, { - "id": "qwen2.5-coder-7b-fast", - "name": "Qwen2.5 Coder 7B fast", - "display_name": "Qwen2.5 Coder 7B fast", + "id": "openai/gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1047576, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - 
"knowledge": "2024-09", - "release_date": "2024-09-15", - "last_updated": "2024-09-15", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.03, - "output": 0.09 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "hermes-2-pro-llama-3-8b", - "name": "Hermes 2 Pro Llama 3 8B", - "display_name": "Hermes 2 Pro Llama 3 8B", + "id": "openai/gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-05-27", - "last_updated": "2024-05-27", + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.14, - "output": 0.14 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "gpt-4.1-mini-2025-04-14", - "name": "OpenAI GPT-4.1 Mini", - "display_name": "OpenAI GPT-4.1 Mini", + "id": "openai/gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ "text", @@ -144389,63 +148571,92 @@ ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 400000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-10-01", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.39999999999999997, - "output": 1.5999999999999999, - "cache_read": 0.09999999999999999 + "input": 0.05, + "output": 0.4, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "kimi-k2-0905", - "name": "Kimi K2 (09/05)", - "display_name": "Kimi K2 (09/05)", + "id": "openai/gpt-5.5-pro", + "name": "GPT-5.5 Pro", + "display_name": "GPT-5.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.39999999999999997 + "input": 30, + "output": 180 }, "type": "chat" }, { - "id": "o1-mini", - "name": "OpenAI: o1-mini", - "display_name": "OpenAI: o1-mini", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -144455,51 +148666,41 @@ ] }, "limit": { - "context": 128000, + "context": 131072, 
"output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.05, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "openai/gpt-image-2", + "name": "GPT Image 2", + "display_name": "GPT Image 2", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { @@ -144507,57 +148708,51 @@ "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", - "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.07 - }, - "type": "chat" + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "type": "imageGeneration" }, { - "id": "gpt-5.1-codex", - "name": "OpenAI: GPT-5.1 Codex", - "display_name": "OpenAI: GPT-5.1 Codex", + "id": "openai/gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, + "context": 1050000, "output": 128000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -144568,178 +148763,288 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 5, + "output": 30 }, "type": "chat" }, { - "id": "claude-3-haiku-20240307", - "name": "Anthropic: Claude 3 Haiku", - "display_name": "Anthropic: Claude 3 Haiku", + "id": "bytedance/seedance-2", + "name": "Seedance 2", + "display_name": "Seedance 2", "modalities": { "input": [ "text", "image" ], + "output": [ + "video" + ] + }, + "limit": { + "context": 4096, + "output": 8192 + }, + "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-01", + "last_updated": "2026-04-01", + "type": "chat" + }, + { + "id": "anthropic/claude-sonnet-4", + "name": "Claude Sonnet 4", + "display_name": "Claude Sonnet 4", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], "output": [ "text" ] }, "limit": { "context": 200000, - "output": 4096 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": 
[ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-03", - "release_date": "2024-03-07", - "last_updated": "2024-03-07", + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "gemma2-9b-it", - "name": "Google Gemma 2", - "display_name": "Google Gemma 2", + "id": "anthropic/claude-opus-4.8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-25", - "last_updated": "2024-06-25", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.01, - "output": 0.03 + "input": 5, + "output": 25 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Google Gemini 3 Pro Preview", - "display_name": "Google Gemini 3 Pro Preview", + "id": "anthropic/claude-opus-4.1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2025-03-31", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.19999999999999998 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct Turbo", - "display_name": "Qwen3 Coder 480B A35B Instruct Turbo", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 16384 + "context": 1000000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.22, - "output": 0.95 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "grok-3-mini", - "name": "xAI Grok 3 Mini", - "display_name": "xAI Grok 3 Mini", + "id": "sarvam/sarvam-105b", + "name": "Sarvam 105B", + "display_name": "Sarvam 105B", "modalities": { "input": [ "text" @@ -144755,24 +149060,23 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "open_weights": true, + "release_date": "2025-09-01", + "last_updated": "2025-09-01", "cost": { - "input": 0.3, - "output": 0.5, - "cache_read": 0.075 + "input": 0.04, + "output": 0.16 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct-turbo", - "name": "Meta Llama 3.1 8B Instruct Turbo", - "display_name": "Meta Llama 3.1 8B Instruct Turbo", + "id": "sarvam/sarvam-30b", + "name": "Sarvam 30B", + "display_name": "Sarvam 30B", "modalities": { "input": [ "text" @@ -144788,23 +149092,23 @@ "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "release_date": "2026-02-18", + "last_updated": "2026-02-18", "cost": { "input": 0.02, - "output": 0.03 + "output": 0.1 }, "type": "chat" }, { - "id": "llama-3.1-8b-instruct", - "name": "Meta Llama 3.1 8B Instruct", - "display_name": "Meta Llama 3.1 8B Instruct", + "id": "deepseek-ai/deepseek-r1-distill-llama-70b", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 
Distill Llama 70B", "modalities": { "input": [ "text" @@ -144814,29 +149118,35 @@ ] }, "limit": { - "context": 16384, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-01-23", + "last_updated": "2025-01-23", "cost": { - "input": 0.02, - "output": 0.049999999999999996 + "input": 0.03, + "output": 0.14 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Meta Llama 3.3 70B Versatile", - "display_name": "Meta Llama 3.3 70B Versatile", + "id": "qwen/qwen3-coder", + "name": "Qwen3 Coder", + "display_name": "Qwen3 Coder", "modalities": { "input": [ "text" @@ -144846,8 +149156,8 @@ ] }, "limit": { - "context": 131072, - "output": 32678 + "context": 262144, + "output": 66536 }, "temperature": true, "tool_call": true, @@ -144855,36 +149165,34 @@ "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.59, - "output": 0.7899999999999999 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking", - "display_name": "Qwen3 235B A22B Thinking", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 81920 + "context": 1000000, + "output": 384000 }, 
"temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -144901,55 +149209,63 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-07-25", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 2.9000000000000004 + "input": 1.74, + "output": 3.48 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "OpenAI GPT-5.1 Chat", - "display_name": "OpenAI GPT-5.1 Chat", + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.12500000000000003 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "grok-4", - "name": "xAI Grok 4", - "display_name": "xAI Grok 4", + "id": "minimax/minimax-m2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -144959,113 +149275,161 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-07-09", - "last_updated": "2024-07-09", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Meta Llama 3.3 70B Instruct", - "display_name": "Meta Llama 3.3 70B Instruct", + "id": "leonardo-ai/lucid-origin", + "name": "Lucid Origin", + "display_name": "Lucid Origin", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 128000, - "output": 16400 + "context": 4096, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", - "cost": { - "input": 0.13, - "output": 0.39 - }, + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "type": "chat" }, { - "id": "llama-prompt-guard-2-22m", - "name": "Meta Llama Prompt Guard 2 22M", - "display_name": "Meta Llama Prompt Guard 2 22M", + "id": "leonardo-ai/lucid-realism", + "name": "Lucid Realism", + "display_name": "Lucid Realism", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "text" + "image" ] }, "limit": { - "context": 512, - "output": 2 + "context": 4096, + "output": 8192 }, - "temperature": true, + "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-01", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", + "type": "chat" + } + ] + }, + "abliteration-ai": { + "id": "abliteration-ai", + "name": "abliteration.ai", + "display_name": "abliteration.ai", + "api": "https://api.abliteration.ai/v1", + "doc": "https://docs.abliteration.ai/models", + "models": [ + { + "id": "abliterated-model", + "name": "Abliterated Model", + "display_name": "Abliterated Model", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 150000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-01-06", + "last_updated": "2026-01-06", "cost": { - "input": 0.01, - "output": 0.01 + "input": 3, + "output": 3 }, "type": "chat" - }, + } + ] + }, + "xpersona": { + "id": "xpersona", + "name": "Xpersona", + "display_name": "Xpersona", + "api": "https://www.xpersona.co/v1", + "doc": "https://www.xpersona.co/docs", + "models": [ { - "id": "o1", - "name": "OpenAI: o1", - "display_name": "OpenAI: o1", + "id": "xpersona-gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -145073,33 +149437,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": 
false, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2025-01-01", + "knowledge": "2025-12-30", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 3, + "output": 18, + "reasoning": 18, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "grok-4-1-fast-reasoning", - "name": "xAI Grok 4.1 Fast Reasoning", - "display_name": "xAI Grok 4.1 Fast Reasoning", + "id": "xpersona-frieren-coder", + "name": "Xpersona Frieren 1", + "display_name": "Xpersona Frieren 1", "modalities": { "input": [ "text", @@ -145110,40 +149472,45 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1000000, + "output": 384000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-11", - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "knowledge": "2025-12-30", + "release_date": "2026-05-01", + "last_updated": "2026-05-25", "cost": { - "input": 0.19999999999999998, - "output": 0.5, - "cache_read": 0.049999999999999996 + "input": 1.5, + "output": 6, + "reasoning": 6, + "cache_read": 0.15 }, "type": "chat" - }, + } + ] + }, + "azure-cognitive-services": { + "id": "azure-cognitive-services", + "name": "Azure Cognitive Services", + "display_name": "Azure Cognitive Services", + "doc": "https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models", + "models": [ { - "id": "claude-opus-4", - "name": "Anthropic: Claude Opus 4", - "display_name": "Anthropic: Claude Opus 4", + "id": "claude-opus-4-5", + "name": "Claude Opus 4.5", + "display_name": "Claude Opus 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -145151,7 +149518,7 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, 
"temperature": true, "tool_call": true, @@ -145163,11 +149530,17 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -145175,180 +149548,207 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-08-01", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "xAI Grok Code Fast 1", - "display_name": "xAI Grok Code Fast 1", + "id": "claude-sonnet-4-5", + "name": "Claude Sonnet 4.5", + "display_name": "Claude Sonnet 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + 
"visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2024-08-25", - "last_updated": "2024-08-25", + "knowledge": "2025-07-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.19999999999999998, - "output": 1.5, - "cache_read": 0.02 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "sonar-deep-research", - "name": "Perplexity Sonar Deep Research", - "display_name": "Perplexity Sonar Deep Research", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 Nano", + "display_name": "GPT-5.4 Nano", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-01-27", - "last_updated": "2025-01-27", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 2, - "output": 8 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": 
"OpenAI GPT-4.1 Nano", - "display_name": "OpenAI GPT-4.1 Nano", + "id": "claude-opus-4-1", + "name": "Claude Opus 4.1", + "display_name": "Claude Opus 4.1", "modalities": { "input": [ "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.09999999999999999, - "output": 0.39999999999999997, - "cache_read": 0.024999999999999998 - }, - "type": "chat" - } - ] - }, - "zai": { - "id": "zai", - "name": "Z.AI", - "display_name": "Z.AI", - "api": "https://api.z.ai/api/paas/v4", - "doc": "https://docs.z.ai/guides/overview/pricing", - "models": [ - { - "id": "glm-4.5-flash", - "name": "GLM-4.5-Flash", - "display_name": "GLM-4.5-Flash", - "modalities": { - "input": [ - "text" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 15, + "output": 75, + "cache_read": 1.5, + "cache_write": 18.75 }, "type": "chat" }, { - "id": "glm-4.7-flashx", - "name": "GLM-4.7-FlashX", - "display_name": "GLM-4.7-FlashX", + "id": "claude-haiku-4-5", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" @@ -145356,130 +149756,196 @@ }, "limit": { "context": 200000, - "output": 131072 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-02-31", + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.07, - "output": 0.4, - "cache_read": 0.01, - "cache_write": 0 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", + "cost": { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 - }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 Mini", + "display_name": "GPT-5.4 Mini", "modalities": { "input": [ - 
"text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "glm-4.5v", - "name": "GLM-4.5V", - "display_name": "GLM-4.5V", + "id": "kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 16384 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -145487,69 +149953,124 @@ "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true + } + }, + "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "knowledge": "2025-01", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - "output": 1.8 + 
"input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "claude-opus-4-6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-08", - "last_updated": "2025-12-08", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.3, - "output": 0.9 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25, + "tiers": [ + { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 37.5, + "cache_read": 1, + "cache_write": 12.5 + } }, "type": "chat" }, { - "id": "glm-4.7-flash", - "name": "GLM-4.7-Flash", - "display_name": "GLM-4.7-Flash", + "id": "gpt-5.4-pro", + "name": "GPT-5.4 Pro", + "display_name": "GPT-5.4 Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -145557,31 +150078,57 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-01-19", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 30, + "output": 180, + "tiers": [ + { + "input": 60, + "output": 270, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 60, + 
"output": 270 + } }, "type": "chat" }, { - "id": "glm-5v-turbo", - "name": "GLM-5V-Turbo", - "display_name": "GLM-5V-Turbo", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ "text", "image", - "video", "pdf" ], "output": [ @@ -145589,10 +150136,10 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 1050000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -145601,75 +150148,115 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "gpt-5.1", + "name": "GPT-5.1", + "display_name": "GPT-5.1", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ - "text" + "text", + "image", + "audio" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": 
false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2, - "cache_write": 0 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "glm-5-turbo", - "name": "GLM-5-Turbo", - "display_name": "GLM-5-Turbo", + "id": "meta-llama-3-70b-instruct", + "name": "Meta-Llama-3-70B-Instruct", + "display_name": "Meta-Llama-3-70B-Instruct", "modalities": { "input": [ "text" @@ -145679,42 +150266,29 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24, - "cache_write": 0 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "phi-3-mini-4k-instruct", 
+ "name": "Phi-3-mini-instruct (4k)", + "display_name": "Phi-3-mini-instruct (4k)", "modalities": { "input": [ "text" @@ -145724,32 +150298,29 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11, - "cache_write": 0 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM-4.5-Air", - "display_name": "GLM-4.5-Air", + "id": "phi-3-mini-128k-instruct", + "name": "Phi-3-mini-instruct (128k)", + "display_name": "Phi-3-mini-instruct (128k)", "modalities": { "input": [ "text" @@ -145759,32 +150330,29 @@ ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "phi-4-mini-reasoning", + "name": "Phi-4-mini-reasoning", + "display_name": "Phi-4-mini-reasoning", "modalities": { "input": [ "text" @@ -145794,8 +150362,8 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, @@ 
-145803,123 +150371,110 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.075, + "output": 0.3 }, "type": "chat" - } - ] - }, - "nova": { - "id": "nova", - "name": "Nova", - "display_name": "Nova", - "api": "https://api.nova.amazon.com/v1", - "doc": "https://nova.amazon.com/dev/documentation", - "models": [ + }, { - "id": "nova-2-pro-v1", - "name": "Nova 2 Pro", - "display_name": "Nova 2 Pro", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2026-01-03", + "knowledge": "2025-08-31", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": 
"nova-2-lite-v1", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "llama-4-maverick-17b-128e-instruct-fp8", + "name": "Llama 4 Maverick 17B 128E Instruct FP8", + "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", "modalities": { "input": [ "text", - "image", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0, - "reasoning": 0 + "input": 0.25, + "output": 1 }, "type": "chat" - } - ] - }, - "nearai": { - "id": "nearai", - "name": "NEAR AI Cloud", - "display_name": "NEAR AI Cloud", - "api": "https://cloud-api.near.ai/v1", - "doc": "https://docs.near.ai/", - "models": [ + }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM-5.1 FP8", - "display_name": "GLM-5.1 FP8", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2", + "display_name": "DeepSeek-V3.2", "modalities": { "input": [ "text" @@ -145929,8 +150484,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -145940,370 +150495,245 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.85, - "output": 3.3 + "input": 0.58, + "output": 1.68 }, "type": "chat" }, { - "id": 
"anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "gpt-5-codex", + "name": "GPT-5-Codex", + "display_name": "GPT-5-Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", + "default_enabled": true, + "mode": "effort", + "effort": "medium", "effort_options": [ + "minimal", "low", "medium", - "high", - "max" + "high" ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "knowledge": "2024-09-30", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5 (latest)", - "display_name": "Claude Haiku 4.5 (latest)", + "id": "model-router", + "name": "Model Router", + "display_name": "Model Router", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-05-19", + "last_updated": "2025-11-18", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.14, + "output": 0 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5 (latest)", - "display_name": "Claude Sonnet 4.5 (latest)", + "id": "gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2023-09", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 3, - "output": 15.5, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "phi-4-multimodal", + "name": "Phi-4-multimodal", + "display_name": "Phi-4-multimodal", "modalities": { "input": [ "text", "image", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.08, + "output": 0.32, + "input_audio": 4 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "phi-4-reasoning-plus", + "name": "Phi-4-reasoning-plus", + "display_name": "Phi-4-reasoning-plus", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "black-forest-labs/FLUX.2-klein-4B", - "name": "FLUX.2 Klein 4B", - "display_name": "FLUX.2 Klein 4B", + "id": "codestral-2501", + "name": "Codestral 25.01", + "display_name": "Codestral 25.01", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 256000, + "output": 256000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "open_weights": false, + "knowledge": "2024-03", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 1, - "output": 1 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "Qwen/Qwen3.6-35B-A3B-FP8", - "name": "Qwen 3.6 35B A3B FP8", - "display_name": "Qwen 3.6 35B A3B FP8", + "id": "cohere-embed-v3-english", + "name": "Embed v3 English", + "display_name": "Embed v3 English", "modalities": { "input": [ "text" @@ -146313,41 +150743,28 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 512, + "output": 1024 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": 
true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-17", - "last_updated": "2026-04-17", + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.17, - "output": 1.1, - "cache_read": 0.056 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B-A3B Instruct 2507", - "display_name": "Qwen3 30B-A3B Instruct 2507", + "id": "phi-3-medium-4k-instruct", + "name": "Phi-3-medium-instruct (4k)", + "display_name": "Phi-3-medium-instruct (4k)", "modalities": { "input": [ "text" @@ -146357,90 +150774,118 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 4096, + "output": 1024 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2025-07-29", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.15, - "output": 0.55 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Reranker-0.6B", - "name": "Qwen3 Reranker 0.6B", - "display_name": "Qwen3 Reranker 0.6B", + "id": "gpt-5-nano", + "name": "GPT-5 Nano", + "display_name": "GPT-5 Nano", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 1024 + "context": 272000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, - "attachment": false, - "open_weights": true, - 
"release_date": "2025-06-03", - "last_updated": "2025-06-03", + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.05, + "output": 0.4, + "cache_read": 0.01 }, - "type": "rerank" + "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-0.6B", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 1024 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2025-06-03", - "last_updated": "2025-06-03", + "attachment": true, + "open_weights": false, + "knowledge": "2023-12", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 0.01, - "output": 0 + "input": 10, + "output": 30 }, - "type": "embedding" + "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen3-VL 30B-A3B Instruct", - "display_name": "Qwen3-VL 30B-A3B Instruct", + "id": "gpt-4.1-mini", + "name": "GPT-4.1 mini", + "display_name": "GPT-4.1 mini", "modalities": { "input": [ "text", @@ -146451,7 +150896,7 @@ ] }, "limit": { - "context": 256000, + "context": 1047576, "output": 32768 }, "temperature": true, @@ -146460,32 +150905,35 @@ "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "open_weights": false, + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.15, - "output": 0.55 + "input": 0.4, + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3.5-122B-A10B", - "name": "Qwen3.5 122B-A10B", - "display_name": "Qwen3.5 122B-A10B", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 272000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -146494,156 +150942,139 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-02-23", - "last_updated": "2026-02-23", + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.4, - "output": 3.2 + "input": 0.25, + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "google/gemini-3-pro", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - 
] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.25, - "output": 15, - "cache_read": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "ministral-3b", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-03", + "release_date": "2024-10-22", + "last_updated": "2024-10-22", + "cost": { + "input": 0.04, + "output": 0.04 + }, + "type": "chat" + }, + { + "id": "llama-3.2-90b-vision-instruct", + "name": "Llama-3.2-90B-Vision-Instruct", + "display_name": "Llama-3.2-90B-Vision-Instruct", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + 
"last_updated": "2024-09-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 2.04, + "output": 2.04 }, "type": "chat" }, { - "id": "google/gemma-4-31B-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "deepseek-v3.1", + "name": "DeepSeek-V3.1", + "display_name": "DeepSeek-V3.1", "modalities": { "input": [ "text" @@ -146653,8 +151084,8 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -146662,38 +151093,35 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "knowledge": "2024-07", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.026 + "input": 0.56, + "output": 1.68 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "o1", + "name": "o1", + "display_name": "o1", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -146701,99 +151129,80 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": 
"2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "knowledge": "2023-09", + "release_date": "2024-12-05", + "last_updated": "2024-12-05", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 15, + "output": 60, + "cache_read": 7.5 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash-Lite", - "display_name": "Gemini 2.5 Flash-Lite", + "id": "gpt-4.1-nano", + "name": "GPT-4.1 nano", + "display_name": "GPT-4.1 nano", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1047576, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 0.1, "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "cache_read": 0.025 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (Reasoning)", + "display_name": "Grok 4 Fast (Reasoning)", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 2000000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -146803,56 
+151212,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "knowledge": "2025-07", + "release_date": "2025-09-19", + "last_updated": "2025-09-19", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "input": 0.2, + "output": 0.5, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "phi-4", + "name": "Phi-4", + "display_name": "Phi-4", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", + "cost": { + "input": 0.125, + "output": 0.5 + }, + "type": "chat" + }, + { + "id": "kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -146863,39 +151285,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + 
"thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, + "attachment": false, + "open_weights": true, "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "release_date": "2026-02-06", + "last_updated": "2026-02-06", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5.1-codex-mini", + "name": "GPT-5.1 Codex Mini", + "display_name": "GPT-5.1 Codex Mini", "modalities": { "input": [ "text", @@ -146913,16 +151325,16 @@ "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -146936,11 +151348,11 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { "input": 0.25, "output": 2, @@ -146949,116 +151361,136 @@ "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "meta-llama-3.1-8b-instruct", + "name": "Meta-Llama-3.1-8B-Instruct", + "display_name": "Meta-Llama-3.1-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": 
false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.3, + "output": 0.61 }, - "attachment": true, + "type": "chat" + }, + { + "id": "gpt-3.5-turbo-0301", + "name": "GPT-3.5 Turbo 0301", + "display_name": "GPT-3.5 Turbo 0301", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 4096, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "knowledge": "2021-08", + "release_date": "2023-03-01", + "last_updated": "2023-03-01", "cost": { - "input": 1.8, - "output": 15.5, - "cache_read": 0.18 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "deepseek-v3.2-speciale", + "name": "DeepSeek-V3.2-Speciale", + "display_name": "DeepSeek-V3.2-Speciale", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 128000 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", 
+ "cost": { + "input": 0.58, + "output": 1.68 }, - "attachment": true, + "type": "chat" + }, + { + "id": "text-embedding-3-small", + "name": "text-embedding-3-small", + "display_name": "text-embedding-3-small", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 1536 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.02, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "gpt-5.3-codex", + "name": "GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", @@ -147085,10 +151517,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -147099,34 +151531,32 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-08-31", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "mistral-large-2411", + "name": "Mistral Large 24.11", + "display_name": "Mistral Large 24.11", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, + "context": 128000, "output": 32768 }, "temperature": true, @@ -147134,22 +151564,21 @@ 
"reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2024-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 2, + "output": 6 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "gpt-4-turbo-vision", + "name": "GPT-4 Turbo Vision", + "display_name": "GPT-4 Turbo Vision", "modalities": { "input": [ "text", @@ -147160,57 +151589,40 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "knowledge": "2023-11", + "release_date": "2023-11-06", + "last_updated": "2024-04-09", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, "temperature": false, @@ -147244,33 +151656,17 @@ "attachment": true, "open_weights": false, "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-12-11", + "last_updated": 
"2025-12-11", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 1.75, + "output": 14, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/o3-mini", + "id": "o3-mini", "name": "o3-mini", "display_name": "o3-mini", "modalities": { @@ -147318,138 +151714,71 @@ "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "text-embedding-ada-002", + "name": "text-embedding-ada-002", + "display_name": "text-embedding-ada-002", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 8192, + "output": 1536 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2022-12-15", + "last_updated": "2022-12-15", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.1, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": 
"GPT-5.1", + "id": "meta-llama-3.1-70b-instruct", + "name": "Meta-Llama-3.1-70B-Instruct", + "display_name": "Meta-Llama-3.1-70B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 2.68, + "output": 3.54 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "mistral-medium-2505", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ "text", @@ -147460,52 +151789,29 @@ ] }, "limit": { - "context": 400000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, 
"open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "phi-4-reasoning", + "name": "Phi-4-reasoning", + "display_name": "Phi-4-reasoning", "modalities": { "input": [ "text" @@ -147515,76 +151821,40 @@ ] }, "limit": { - "context": 131000, - "output": 32768 + "context": 32000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.15, - "output": 0.55 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { - "input": [ - "text", - "image", - "pdf" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.125, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "gpt-5.1-codex", + "name": "GPT-5.1 Codex", + "display_name": "GPT-5.1 Codex", "modalities": { "input": [ "text", - "image" + "image", + "audio" ], "output": [ - "text" + 
"text", + "image", + "audio" ] }, "limit": { @@ -147607,8 +151877,7 @@ "none", "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -147619,153 +151888,117 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "openai/whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "gpt-3.5-turbo-0613", + "name": "GPT-3.5 Turbo 0613", + "display_name": "GPT-3.5 Turbo 0613", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 448, - "output": 448 + "context": 16384, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2023-11-06", - "last_updated": "2023-11-06", + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-06-13", + "last_updated": "2023-06-13", "cost": { - "input": 0.01, - "output": 0 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "openai/gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "cohere-embed-v3-multilingual", + "name": "Embed v3 Multilingual", + "display_name": "Embed v3 Multilingual", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512, + "output": 1024 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - 
"default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2023-11-07", + "last_updated": "2023-11-07", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 0.1, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "gpt-3.5-turbo-0125", + "name": "GPT-3.5 Turbo 0125", + "display_name": "GPT-3.5 Turbo 0125", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 16384, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2021-08", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.5, + "output": 1.5 }, "type": "chat" - } - ] - }, - "inceptron": { - "id": "inceptron", - "name": "Inceptron", - "display_name": "Inceptron", - "api": "https://api.inceptron.io/v1", - "doc": "https://docs.inceptron.io", - "models": [ + }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "phi-3-small-8k-instruct", + "name": "Phi-3-small-instruct (8k)", + "display_name": "Phi-3-small-instruct (8k)", "modalities": { "input": [ "text" @@ -147775,36 +152008,29 @@ ] }, "limit": { - "context": 
196608, - "output": 196608 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 0.24, - "output": 0.9, - "cache_read": 0.03, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1-FP8", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -147814,11 +152040,11 @@ ] }, "limit": { - "context": 202752, - "output": 202752 + "context": 163840, + "output": 163840 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -147836,24 +152062,22 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -147880,23 +152104,60 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2024-08", + "release_date": "2025-11-06", + "last_updated": "2025-12-02", "cost": { - "input": 0.78, - 
"output": 3.5, - "cache_read": 0.2, - "cache_write": 0 + "input": 0.6, + "output": 2.5, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "nvidia/llama-3.3-70b-instruct-fp8", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": "gpt-5.1-chat", + "name": "GPT-5.1 Chat", + "display_name": "GPT-5.1 Chat", + "modalities": { + "input": [ + "text", + "image", + "audio" + ], + "output": [ + "text", + "image", + "audio" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-09-30", + "release_date": "2025-11-14", + "last_updated": "2025-11-14", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125 + }, + "type": "chat" + }, + { + "id": "llama-3.3-70b-instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -147906,40 +152167,29 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, "knowledge": "2023-12", "release_date": "2024-12-06", "last_updated": "2024-12-06", "cost": { - "input": 0.12, - "output": 0.38, - "cache_read": 0, - "cache_write": 0 + "input": 0.71, + "output": 0.71 }, "type": "chat" - } - ] - }, - "xpersona": { - "id": "xpersona", - "name": "Xpersona", - "display_name": "Xpersona", - "api": "https://www.xpersona.co/v1", - "doc": "https://www.xpersona.co/docs", - "models": [ + }, { - "id": "xpersona-gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "llama-4-scout-17b-16e-instruct", + "name": "Llama 4 Scout 17B 16E Instruct", + "display_name": "Llama 4 Scout 17B 16E Instruct", "modalities": { "input": [ "text", @@ -147950,492 +152200,306 @@ ] }, "limit": { 
- "context": 1000000, - "output": 128000 + "context": 128000, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-12-30", - "release_date": "2026-05-29", - "last_updated": "2026-05-29", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 3, - "output": 18, - "reasoning": 18, - "cache_read": 0.3 + "input": 0.2, + "output": 0.78 }, "type": "chat" }, { - "id": "xpersona-frieren-coder", - "name": "Xpersona Frieren 1", - "display_name": "Xpersona Frieren 1", + "id": "gpt-3.5-turbo-1106", + "name": "GPT-3.5 Turbo 1106", + "display_name": "GPT-3.5 Turbo 1106", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 16384, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-12-30", - "release_date": "2026-05-01", - "last_updated": "2026-05-25", + "knowledge": "2021-08", + "release_date": "2023-11-06", + "last_updated": "2023-11-06", "cost": { - "input": 1.5, - "output": 6, - "reasoning": 6, - "cache_read": 0.15 + "input": 1, + "output": 2 }, "type": "chat" - } - ] - }, - "perplexity-agent": { - "id": "perplexity-agent", - "name": "Perplexity Agent", - "display_name": "Perplexity Agent", - "api": "https://api.perplexity.ai/v1", - "doc": "https://docs.perplexity.ai/docs/agent-api/models", - "models": [ + }, { - "id": 
"anthropic/claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "phi-4-mini", + "name": "Phi-4-mini", + "display_name": "Phi-4-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "cohere-command-r-plus-08-2024", + "name": "Command R+", + "display_name": "Command R+", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "meta-llama-3.1-405b-instruct", + "name": "Meta-Llama-3.1-405B-Instruct", + "display_name": "Meta-Llama-3.1-405B-Instruct", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "attachment": false, + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1 + "input": 5.33, + "output": 16 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gpt-4-32k", + "name": "GPT-4 32K", + "display_name": "GPT-4 32K", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "phi-3-medium-128k-instruct", + "name": "Phi-3-medium-instruct (128k)", + "display_name": "Phi-3-medium-instruct (128k)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "o4-mini", + "name": "o4-mini", + "display_name": "o4-mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 100000 }, "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ "low", "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" + "high" ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.275 }, "type": "chat" }, { - "id": "xai/grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "gpt-4", + "name": "GPT-4", + "display_name": "GPT-4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 30000 + "context": 8192, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "knowledge": "2023-11", + "release_date": "2023-03-14", + "last_updated": "2023-03-14", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -148443,29 +152507,29 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 16384 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09-01", - "release_date": "2024-01-01", - "last_updated": "2025-09-01", + "knowledge": "2023-09", + "release_date": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 0.25, - "output": 2.5, - "cache_read": 0.0625 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, 
{ - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron 3 Super 120B", - "display_name": "Nemotron 3 Super 120B", + "id": "cohere-command-r-08-2024", + "name": "Command R", + "display_name": "Command R", "modalities": { "input": [ "text" @@ -148475,47 +152539,43 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 128000, + "output": 4000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "knowledge": "2024-06-01", + "release_date": "2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 0.25, - "output": 2.5 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "google/gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "gpt-5-pro", + "name": "GPT-5 Pro", + "display_name": "GPT-5 Pro", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 400000, + "output": 272000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -148525,141 +152585,76 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { - "input": 0.5, - "output": 3, - 
"cache_read": 0.05, - "tiers": [ - { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 - } + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "llama-3.2-11b-vision-instruct", + "name": "Llama-3.2-11B-Vision-Instruct", + "display_name": "Llama-3.2-11B-Vision-Instruct", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 0.37, + "output": 0.37 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "cohere-command-a", + "name": "Command A", + "display_name": "Command A", "modalities": { "input": [ - "text", - "image", - 
"video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -148667,113 +152662,56 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "attachment": false, + "open_weights": true, + "knowledge": "2024-06-01", + "release_date": "2025-03-13", + "last_updated": "2025-03-13", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "gpt-5-chat", + "name": "GPT-5 Chat", + "display_name": "GPT-5 Chat", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, 
"attachment": true, - "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "open_weights": false, + "knowledge": "2024-10-24", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "gpt-5", + "name": "GPT-5", + "display_name": "GPT-5", "modalities": { "input": [ "text", @@ -148784,7 +152722,7 @@ ] }, "limit": { - "context": 400000, + "context": 272000, "output": 128000 }, "temperature": false, @@ -148816,20 +152754,20 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", + "knowledge": "2024-09-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 1.25, + "output": 10, + "cache_read": 0.13 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "cohere-embed-v-4-0", + "name": "Embed v4", + "display_name": "Embed v4", "modalities": { "input": [ "text", @@ -148840,123 +152778,103 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 1536 }, "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + 
"release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.12, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "mistral-nemo", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 128000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.15, + "output": 0.15 }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "type": "chat" + }, + { + "id": "phi-3.5-mini-instruct", + "name": "Phi-3.5-mini-instruct", + "display_name": "Phi-3.5-mini-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 0.13, + "output": 0.52 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": 
"o1-mini", + "name": "o1-mini", + "display_name": "o1-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 128000, + "output": 65536 }, "temperature": false, "tool_call": true, @@ -148971,13 +152889,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -148985,22 +152896,52 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "knowledge": "2023-09", + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 + "input": 1.1, + "output": 4.4, + "cache_read": 0.55 }, "type": "chat" }, { - "id": "openai/gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "text-embedding-3-large", + "name": "text-embedding-3-large", + "display_name": "text-embedding-3-large", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 8191, + "output": 3072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.13, + "output": 0 + }, + "type": "embedding" + }, + { + "id": "mistral-small-2503", + "name": "Mistral Small 3.1", + "display_name": "Mistral Small 3.1", "modalities": { "input": [ "text", @@ -149011,102 +152952,61 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - 
"mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "knowledge": "2024-09", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.3 }, "type": "chat" - } - ] - }, - "abliteration-ai": { - "id": "abliteration-ai", - "name": "abliteration.ai", - "display_name": "abliteration.ai", - "api": "https://api.abliteration.ai/v1", - "doc": "https://docs.abliteration.ai/models", - "models": [ + }, { - "id": "abliterated-model", - "name": "Abliterated Model", - "display_name": "Abliterated Model", + "id": "meta-llama-3-8b-instruct", + "name": "Meta-Llama-3-8B-Instruct", + "display_name": "Meta-Llama-3-8B-Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 150000, - "output": 8192 + "context": 8192, + "output": 2048 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-06", - "last_updated": "2026-01-06", + "knowledge": "2023-12", + "release_date": "2024-04-18", + "last_updated": "2024-04-18", "cost": { - "input": 3, - "output": 3 + "input": 0.3, + "output": 0.61 }, "type": "chat" - } - ] - }, - "minimax-cn": { - "id": "minimax-cn", - "name": "MiniMax (minimaxi.com)", - "display_name": "MiniMax (minimaxi.com)", - "api": "https://api.minimaxi.com/anthropic/v1", - "doc": "https://platform.minimaxi.com/docs/guides/quickstart", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": 
"phi-3-small-128k-instruct", + "name": "Phi-3-small-instruct (128k)", + "display_name": "Phi-3-small-instruct (128k)", "modalities": { "input": [ "text" @@ -149116,51 +153016,75 @@ ] }, "limit": { - "context": 204800, + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "knowledge": "2023-10", + "release_date": "2024-04-23", + "last_updated": "2024-04-23", + "cost": { + "input": 0.15, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "deepseek-v3-0324", + "name": "DeepSeek-V3-0324", + "display_name": "DeepSeek-V3-0324", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-07", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 1.14, + "output": 4.56 }, "type": "chat" }, { - "id": "MiniMax-M3", - "name": "MiniMax-M3", - "display_name": "MiniMax-M3", + "id": "o3", + "name": "o3", + "display_name": "o3", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -149168,63 +153092,69 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": 
"hidden" } }, "attachment": true, - "open_weights": true, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "open_weights": false, + "knowledge": "2024-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.12 + "input": 2, + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - "display_name": "MiniMax-M2.5-highspeed", + "id": "gpt-5.2-chat", + "name": "GPT-5.2 Chat", + "display_name": "GPT-5.2 Chat", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-r1-0528", + "name": "DeepSeek-R1-0528", + "display_name": "DeepSeek-R1-0528", "modalities": { "input": [ "text" @@ -149234,8 +153164,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -149256,20 +153186,19 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-07", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.3, - "output": 
1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 1.35, + "output": 5.4 }, "type": "chat" }, { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "gpt-3.5-turbo-instruct", + "name": "GPT-3.5 Turbo Instruct", + "display_name": "GPT-3.5 Turbo Instruct", "modalities": { "input": [ "text" @@ -149279,34 +153208,61 @@ ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 4096, + "output": 4096 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "attachment": false, + "open_weights": false, + "knowledge": "2021-08", + "release_date": "2023-09-21", + "last_updated": "2023-09-21", + "cost": { + "input": 1.5, + "output": 2 + }, + "type": "chat" + }, + { + "id": "phi-3.5-moe-instruct", + "name": "Phi-3.5-MoE-instruct", + "display_name": "Phi-3.5-MoE-instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "knowledge": "2023-10", + "release_date": "2024-08-20", + "last_updated": "2024-08-20", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.16, + "output": 0.64 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "codex-mini", + "name": "Codex Mini", + "display_name": "Codex Mini", "modalities": { "input": [ "text" @@ -149316,8 +153272,52 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 100000 + }, + "temperature": false, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": 
false, + "knowledge": "2024-04", + "release_date": "2025-05-16", + "last_updated": "2025-05-16", + "cost": { + "input": 1.5, + "output": 6, + "cache_read": 0.375 + }, + "type": "chat" + } + ] + }, + "baseten": { + "id": "baseten", + "name": "Baseten", + "display_name": "Baseten", + "api": "https://inference.baseten.co/v1", + "doc": "https://docs.baseten.co/inference/model-apis/overview", + "models": [ + { + "id": "moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -149336,33 +153336,34 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.95, + "output": 4, + "cache_read": 0.16 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -149372,32 +153373,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "knowledge": "2025-12", + "release_date": "2026-01-30", + "last_updated": "2026-02-12", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.6, + 
"output": 3, + "cache_read": 0.12 }, "type": "chat" - } - ] - }, - "qiniu-ai": { - "id": "qiniu-ai", - "name": "Qiniu", - "display_name": "Qiniu", - "api": "https://api.qnaigc.com/v1", - "doc": "https://developer.qiniu.com/aitokenapi", - "models": [ + }, { - "id": "qwen3-30b-a3b-instruct-2507", - "name": "Qwen3 30b A3b Instruct 2507", - "display_name": "Qwen3 30b A3b Instruct 2507", + "id": "openai/gpt-oss-120b", + "name": "OpenAI GPT 120B", + "display_name": "OpenAI GPT 120B", "modalities": { "input": [ "text" @@ -149407,24 +153407,35 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 128072, + "output": 128072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "open_weights": true, + "knowledge": "2025-08", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.1, + "output": 0.5 + }, "type": "chat" }, { - "id": "deepseek-r1-0528", - "name": "DeepSeek-R1-0528", - "display_name": "DeepSeek-R1-0528", + "id": "nvidia/Nemotron-120B-A12B", + "name": "Nemotron Super", + "display_name": "Nemotron Super", "modalities": { "input": [ "text" @@ -149434,8 +153445,8 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 202800, + "output": 202800 }, "temperature": true, "tool_call": true, @@ -149455,28 +153466,32 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2026-02", + "release_date": "2026-03-11", + "last_updated": "2026-03-11", + "cost": { + "input": 0.06, + "output": 0.75, + "cache_read": 0.06 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-code", - "name": "Doubao Seed 2.0 Code", - "display_name": "Doubao Seed 2.0 Code", + "id": 
"nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B", + "name": "Nemotron Ultra", + "display_name": "Nemotron Ultra", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 202800, + "output": 202800 }, "temperature": true, "tool_call": true, @@ -149484,44 +153499,77 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-06-04", + "last_updated": "2026-06-04", + "cost": { + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 + }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "zai-org/GLM-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 202800, + "output": 202800 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-22", - "last_updated": "2025-10-22", - "type": "imageGeneration" + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.95, + "output": 3.15, + "cache_read": 0.2 + }, + "type": "chat" }, { - "id": 
"qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -149531,24 +153579,42 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", + "cost": { + "input": 0.12, + "output": 2.2, + "cache_read": 0.12 + }, "type": "chat" }, { - "id": "qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "zai-org/GLM-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -149558,13 +153624,14 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 202800, + "output": 202800 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -149578,45 +153645,52 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-06", - "last_updated": "2025-09-06", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1.3, + "output": 4.3, + "cache_read": 0.26 + }, "type": "chat" }, { - "id": "qwen2.5-vl-72b-instruct", - "name": "Qwen 2.5 VL 72B Instruct", - "display_name": "Qwen 2.5 VL 72B Instruct", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": 
"DeepSeek V3.1", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 164000, + "output": 131000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-08-25", + "last_updated": "2025-08-25", + "cost": { + "input": 0.5, + "output": 1.5 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen3-32b", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "deepseek-ai/DeepSeek-V4-Pro", + "name": "Deepseek V4 Pro", + "display_name": "Deepseek V4 Pro", "modalities": { "input": [ "text" @@ -149626,8 +153700,8 @@ ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 131000, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -149647,15 +153721,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 + }, "type": "chat" }, { - "id": "deepseek-v3-0324", - "name": "DeepSeek-V3-0324", - "display_name": "DeepSeek-V3-0324", + "id": "MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -149665,64 +153745,81 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 204000, + "output": 204000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] 
+ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2026-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" - }, + } + ] + }, + "atomic-chat": { + "id": "atomic-chat", + "name": "Atomic Chat", + "display_name": "Atomic Chat", + "api": "http://127.0.0.1:1337/v1", + "doc": "https://atomic.chat", + "models": [ { - "id": "qwen3-vl-30b-a3b-thinking", - "name": "Qwen3-Vl 30b A3b Thinking", - "display_name": "Qwen3-Vl 30b A3b Thinking", + "id": "gemma-4-E4B-it-IQ4_XS", + "name": "Gemma 4 E4B Instruct (IQ4_XS)", + "display_name": "Gemma 4 E4B Instruct (IQ4_XS)", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 32768, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0, + "output": 0 }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-09", - "last_updated": "2026-02-09", "type": "chat" }, { - "id": "MiniMax-M1", - "name": "MiniMax M1", - "display_name": "MiniMax M1", + "id": "Meta-Llama-3_1-8B-Instruct-GGUF", + "name": "Meta Llama 3.1 8B Instruct (GGUF)", + "display_name": "Meta Llama 3.1 8B Instruct (GGUF)", "modalities": { "input": [ "text" @@ -149732,113 +153829,132 @@ ] }, "limit": { - "context": 1000000, - "output": 80000 + "context": 131072, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": 
true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "qwen-max-2025-01-25", - "name": "Qwen2.5-Max-2025-01-25", - "display_name": "Qwen2.5-Max-2025-01-25", + "id": "Qwen3_5-9B-MLX-4bit", + "name": "Qwen 3.5 9B (MLX 4-bit)", + "display_name": "Qwen 3.5 9B (MLX 4-bit)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "gemma-4-E4B-it-MLX-4bit", + "name": "Gemma 4 E4B Instruct (MLX 4-bit)", + "display_name": "Gemma 4 E4B Instruct (MLX 4-bit)", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 32768, "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0, + "output": 0 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "doubao-seed-2.0-mini", - "name": "Doubao Seed 2.0 Mini", - "display_name": "Doubao Seed 
2.0 Mini", + "id": "Qwen3_5-9B-Q4_K_M", + "name": "Qwen 3.5 9B (Q4_K_M)", + "display_name": "Qwen 3.5 9B (Q4_K_M)", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 32768, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "open_weights": true, + "release_date": "2026-03-05", + "last_updated": "2026-04-04", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" - }, + } + ] + }, + "routing-run": { + "id": "routing-run", + "name": "routing.run", + "display_name": "routing.run", + "api": "https://ai.routing.sh/v1", + "doc": "https://docs.routing.run/api-reference/models", + "models": [ { - "id": "qwen3-235b-a22b", - "name": "Qwen 3 235B A22B", - "display_name": "Qwen 3 235B A22B", + "id": "route/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -149848,13 +153964,14 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -149868,64 +153985,66 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.0028 + }, "type": "chat" }, { - "id": "claude-3.7-sonnet", - "name": "Claude 3.7 Sonnet", - "display_name": "Claude 3.7 Sonnet", + "id": "route/deepseek-v4-flash-6bit", + "name": "DeepSeek V4 Flash 6bit", + "display_name": "DeepSeek V4 Flash 6bit", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", + "interleaved": true, + "summaries": true, + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.0028 + }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "route/minimax-m2.7-highspeed", + "name": "MiniMax M2.7 Highspeed", + "display_name": "MiniMax M2.7 Highspeed", "modalities": { "input": [ "text" @@ -149935,13 +154054,14 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -149955,15 +154075,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 + }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": 
"route/glm-5.1-6bit", + "name": "GLM 5.1 6bit", + "display_name": "GLM 5.1 6bit", "modalities": { "input": [ "text" @@ -149973,8 +154099,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -149984,19 +154110,31 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.26, + "cache_write": 0 + }, "type": "chat" }, { - "id": "doubao-1.5-thinking-pro", - "name": "Doubao 1.5 Thinking Pro", - "display_name": "Doubao 1.5 Thinking Pro", + "id": "route/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -150006,37 +154144,48 @@ ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", + "cost": { + "input": 0.193, + "output": 1.238, + "cache_read": 0.03, + "cache_write": 0.375 + }, "type": "chat" }, { - "id": "claude-3.5-haiku", - "name": "Claude 3.5 Haiku", - "display_name": "Claude 3.5 Haiku", + "id": "route/mistral-small-2503", + "name": "Mistral Small 2503", + "display_name": "Mistral Small 2503", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - 
"context": 200000, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -150044,83 +154193,53 @@ "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2025-08-26", - "type": "chat" - }, - { - "id": "deepseek-r1", - "name": "DeepSeek-R1", - "display_name": "DeepSeek-R1", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "open_weights": true, + "knowledge": "2025-06", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", + "cost": { + "input": 0.15, + "output": 0.6 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "claude-3.5-sonnet", - "name": "Claude 3.5 Sonnet", - "display_name": "Claude 3.5 Sonnet", + "id": "route/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8200 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-09-09", - "last_updated": "2025-09-09", + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.1, + "output": 0.3 + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-thinking-2507", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + 
"id": "route/step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ "text" @@ -150131,7 +154250,7 @@ }, "limit": { "context": 262144, - "output": 4096 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150151,15 +154270,21 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 + }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "route/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -150169,8 +154294,8 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 202752, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150180,33 +154305,42 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 1, + "output": 3, + "cache_read": 0.26, + "cache_write": 0 + }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "route/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ - "text", - "image", - "video", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150217,32 +154351,30 @@ "extra_capabilities": { 
"reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.003625 + }, "type": "chat" }, { - "id": "doubao-1.5-pro-32k", - "name": "Doubao 1.5 Pro 32k", - "display_name": "Doubao 1.5 Pro 32k", + "id": "route/mistral-large-3", + "name": "Mistral Large 3", + "display_name": "Mistral Large 3", "modalities": { "input": [ "text" @@ -150253,7 +154385,7 @@ }, "limit": { "context": 128000, - "output": 12000 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -150261,15 +154393,20 @@ "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2024-11", + "release_date": "2024-11-01", + "last_updated": "2025-12-02", + "cost": { + "input": 0.5, + "output": 1.5 + }, "type": "chat" }, { - "id": "qwen3-30b-a3b", - "name": "Qwen3 30B A3B", - "display_name": "Qwen3 30B A3B", + "id": "route/deepseek-v4-pro-6bit", + "name": "DeepSeek V4 Pro 6bit", + "display_name": "DeepSeek V4 Pro 6bit", "modalities": { "input": [ "text" @@ -150279,8 +154416,8 @@ ] }, "limit": { - "context": 40000, - "output": 4096 + "context": 1000000, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -150300,49 +154437,25 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" - }, - { - "id": "claude-4.0-sonnet", - "name": "Claude 4.0 
Sonnet", - "display_name": "Claude 4.0 Sonnet", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 200000, - "output": 64000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.4928, + "output": 0.7392, + "cache_read": 0.003625 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "qwen-vl-max-2025-01-25", - "name": "Qwen VL-MAX-2025-01-25", - "display_name": "Qwen VL-MAX-2025-01-25", + "id": "route/mistral-medium-2505", + "name": "Mistral Medium 2505", + "display_name": "Mistral Medium 2505", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -150351,7 +154464,7 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 32768 }, "temperature": true, "tool_call": true, @@ -150360,91 +154473,64 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" - }, - { - "id": "qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "knowledge": "2025-05", + "release_date": "2025-05-07", + "last_updated": "2025-05-07", + "cost": { + "input": 0.4, + "output": 2 }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-14", - "last_updated": "2025-08-14", "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "route/minimax-m2.7", + "name": 
"MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", + "cost": { + "input": 0.33, + "output": 1.32, + "cache_read": 0.06, + "cache_write": 0.375 + }, "type": "chat" }, { - "id": "qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "route/qwen3.6-27b-202k", + "name": "Qwen3.6 27B 202K", + "display_name": "Qwen3.6 27B 202K", "modalities": { "input": [ "text" @@ -150454,14 +154540,13 @@ ] }, "limit": { - "context": 131072, + "context": 202000, "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -150475,20 +154560,23 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-12", - "last_updated": "2025-09-12", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1.1, + "output": 3.3 + }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "route/kimi-k2.5", + 
"name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -150496,86 +154584,92 @@ ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 131072, + "output": 32768 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", + "cost": { + "input": 0.462, + "output": 2.42, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "claude-4.5-haiku", - "name": "Claude 4.5 Haiku", - "display_name": "Claude 4.5 Haiku", + "id": "route/minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "display_name": "MiniMax M2.5 Highspeed", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 100000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", + "cost": { + "input": 0.193, + "output": 1.238, + "cache_read": 0.06, + "cache_write": 0.375 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-10-16", - "last_updated": "2025-10-16", "type": "chat" }, { - "id": 
"claude-4.1-opus", - "name": "Claude 4.1 Opus", - "display_name": "Claude 4.1 Opus", + "id": "route/kimi-k2.6-6bit", + "name": "Kimi K2.6 6bit", + "display_name": "Kimi K2.6 6bit", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150583,19 +154677,38 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-06", - "last_updated": "2025-08-06", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.462, + "output": 2.42, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "qwen-turbo", - "name": "Qwen-Turbo", - "display_name": "Qwen-Turbo", + "id": "route/mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" @@ -150603,7 +154716,7 @@ }, "limit": { "context": 1000000, - "output": 4096 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150622,16 +154735,38 @@ ] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "doubao-seed-2.0-pro", - "name": "Doubao 
Seed 2.0 Pro", - "display_name": "Doubao Seed 2.0 Pro", + "id": "route/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ "text", @@ -150643,8 +154778,8 @@ ] }, "limit": { - "context": 256000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150652,79 +154787,79 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", - "type": "chat" - }, - { - "id": "doubao-1.5-vision-pro", - "name": "Doubao 1.5 Vision Pro", - "display_name": "Doubao 1.5 Vision Pro", - "modalities": { - "input": [ - "text", - "image", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 16000 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", + "cost": { + "input": 0.462, + "output": 2.42, + "cache_read": 0.16 + }, "type": "chat" }, { - "id": "claude-4.5-opus", - "name": "Claude 4.5 Opus", - "display_name": "Claude 4.5 Opus", + "id": "route/qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 202000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 1.1, + "output": 3.3 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "route/mimo-v2.5-pro-6bit", + "name": "MiMo V2.5 Pro 6bit", + "display_name": "MiMo V2.5 Pro 6bit", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -150732,36 +154867,69 @@ ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 1000000, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "claude-4.5-sonnet", - "name": "Claude 4.5 Sonnet", - "display_name": "Claude 4.5 Sonnet", + "id": "route/stepfun-3.5-flash", + "name": "StepFun 3.5 Flash", + "display_name": "StepFun 3.5 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 65536 }, "temperature": true, 
"tool_call": true, @@ -150769,16 +154937,33 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", + "cost": { + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 + }, "type": "chat" }, { - "id": "doubao-seed-1.6-flash", - "name": "Doubao-Seed 1.6 Flash", - "display_name": "Doubao-Seed 1.6 Flash", + "id": "route/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ "text", @@ -150790,8 +154975,8 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1000000, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -150799,28 +154984,60 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, - "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "open_weights": true, + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", + "cost": { + "input": 0.45, + "output": 1.35, + "cache_read": 0.2, + "tiers": [ + { + "input": 2, + "output": 6, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 256000 + } + } + ], + "context_over_200k": { + "input": 2, + "output": 6, + "cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "claude-4.0-opus", - "name": "Claude 4.0 Opus", - "display_name": "Claude 4.0 Opus", + "id": "route/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", 
"modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150828,61 +155045,46 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "type": "chat" - }, - { - "id": "qwen2.5-vl-7b-instruct", - "name": "Qwen 2.5 VL 7B Instruct", - "display_name": "Qwen 2.5 VL 7B Instruct", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false + "attachment": false, + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-01-29", + "last_updated": "2026-02-13", + "cost": { + "input": 0.096, + "output": 0.288, + "cache_read": 0.019 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", "type": "chat" }, { - "id": "gemini-3.0-pro-preview", - "name": "Gemini 3.0 Pro Preview", - "display_name": "Gemini 3.0 Pro Preview", + "id": "route/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", "image", - "video", - "pdf", - "audio" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 163840, + "output": 163840 }, "temperature": true, "tool_call": true, @@ -150893,44 +155095,51 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, 
"visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, - "open_weights": false, - "release_date": "2025-11-19", - "last_updated": "2025-11-19", + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", + "cost": { + "input": 0.4928, + "output": 0.7392 + }, "type": "chat" - }, + } + ] + }, + "google-vertex": { + "id": "google-vertex", + "name": "Vertex", + "display_name": "Vertex", + "doc": "https://cloud.google.com/vertex-ai/generative-ai/docs/models", + "models": [ { - "id": "qwen3-30b-a3b-thinking-2507", - "name": "Qwen3 30b A3b Thinking 2507", - "display_name": "Qwen3 30b A3b Thinking 2507", + "id": "gemini-2.5-pro-tts", + "name": "Gemini 2.5 Pro TTS", + "display_name": "Gemini 2.5 Pro TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 126000, - "output": 32000 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -150938,35 +155147,52 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": false, "open_weights": false, - "release_date": "2026-02-04", - "last_updated": "2026-02-04", + "knowledge": "2025-01", + "release_date": "2025-09-30", + "last_updated": "2025-12-10", + "cost": { + "input": 1, + "output": 20 + }, "type": "chat" }, { - "id": "glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + 
"video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 98304 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -150974,82 +155200,148 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 + }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "DeepSeek-V3", - "display_name": "DeepSeek-V3", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16000 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-08-13", + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", + "cost": { + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 
+ } + }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235b A22B Instruct 2507", - "display_name": "Qwen3 235b A22B Instruct 2507", + "id": "gemini-2.5-flash-tts", + "name": "Gemini 2.5 Flash TTS", + "display_name": "Gemini 2.5 Flash TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-12", - "last_updated": "2025-08-12", + "knowledge": "2025-01", + "release_date": "2025-09-30", + "last_updated": "2025-12-10", + "cost": { + "input": 0.5, + "output": 10 + }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -151060,30 +155352,46 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-22", - "last_updated": "2026-02-22", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + }, "type": "chat" }, { - "id": "gemini-3.0-flash-preview", - 
"name": "Gemini 3.0 Flash Preview", - "display_name": "Gemini 3.0 Flash Preview", + "id": "gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ "text", "image", - "audio", "video", + "audio", "pdf" ], "output": [ @@ -151091,8 +155399,8 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -151121,14 +155429,21 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", + "cost": { + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 + }, "type": "chat" }, { - "id": "mimo-v2-flash", - "name": "Mimo-V2-Flash", - "display_name": "Mimo-V2-Flash", + "id": "gemini-embedding-001", + "name": "Gemini Embedding 001", + "display_name": "Gemini Embedding 001", "modalities": { "input": [ "text" @@ -151138,71 +155453,115 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 2048, + "output": 1 }, - "temperature": true, - "tool_call": true, + "temperature": false, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "open_weights": false, + "knowledge": "2025-05", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.15, + "output": 0 }, - "type": "chat" + "type": "embedding" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro Preview Custom Tools", + "display_name": "Gemini 3.1 Pro Preview Custom Tools", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" 
], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "doubao-seed-1.6-thinking", - "name": "Doubao-Seed 1.6 Thinking", - "display_name": "Doubao-Seed 1.6 Thinking", + "id": "gemini-flash-lite-latest", + "name": "Gemini Flash-Lite Latest", + "display_name": "Gemini Flash-Lite Latest", "modalities": { "input": [ - "image", "text", - "video" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -151212,58 +155571,96 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "knowledge": "2025-01", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 
Flash-Lite", + "display_name": "Gemini 2.5 Flash-Lite", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-19", - "last_updated": "2025-08-19", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.1, + "output": 0.4, + "cache_read": 0.01, + "input_audio": 0.3 + }, "type": "chat" }, { - "id": "gemini-3.0-pro-image-preview", - "name": "Gemini 3.0 Pro Image Preview", - "display_name": "Gemini 3.0 Pro Image Preview", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -151287,25 +155684,51 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": 
"context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } + }, "type": "chat" }, { - "id": "glm-4.5-air", - "name": "GLM 4.5 Air", - "display_name": "GLM 4.5 Air", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4096 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -151313,58 +155736,96 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 + }, "type": "chat" }, { - "id": "kling-v2-6", - "name": "Kling-V2 6", - "display_name": "Kling-V2 6", + "id": "gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ "text", "image", - "video" + "audio", + "video", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 99999999, - "output": 99999999 + "context": 1048576, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-01-13", - "last_updated": "2026-01-13", + "knowledge": "2025-01", + "release_date": "2025-09-25", + 
"last_updated": "2025-09-25", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.075, + "cache_write": 0.383 + }, "type": "chat" }, { - "id": "doubao-seed-1.6", - "name": "Doubao-Seed 1.6", - "display_name": "Doubao-Seed 1.6", + "id": "gemini-3.1-flash-lite-preview", + "name": "Gemini 3.1 Flash Lite Preview", + "display_name": "Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1048576, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -151372,29 +155833,39 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-08-15", - "last_updated": "2025-08-15", + "knowledge": "2025-01", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025, + "input_audio": 0.5 + }, "type": "chat" }, { - "id": "doubao-seed-2.0-lite", - "name": "Doubao Seed 2.0 Lite", - "display_name": "Doubao Seed 2.0 Lite", + "id": "moonshotai/kimi-k2-thinking-maas", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -151402,16 +155873,32 @@ "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-11-13", + 
"last_updated": "2025-11-13", + "cost": { + "input": 0.6, + "output": 2.5 + }, "type": "chat" }, { - "id": "z-ai/glm-4.6", - "name": "Z-AI/GLM 4.6", - "display_name": "Z-AI/GLM 4.6", + "id": "openai/gpt-oss-120b-maas", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -151421,29 +155908,29 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-10-11", - "last_updated": "2025-10-11", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.09, + "output": 0.36 + }, "type": "chat" }, { - "id": "z-ai/glm-4.7", - "name": "Z-Ai/GLM 4.7", - "display_name": "Z-Ai/GLM 4.7", + "id": "openai/gpt-oss-20b-maas", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -151453,8 +155940,8 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 131072, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -151462,55 +155949,65 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": true, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", + "cost": { + "input": 0.07, + "output": 0.25 + }, "type": "chat" }, { - "id": "z-ai/autoglm-phone-9b", - "name": "Z-Ai/Autoglm Phone 9b", - "display_name": "Z-Ai/Autoglm Phone 9b", + "id": "zai-org/glm-4.7-maas", + "name": "GLM-4.7", + "display_name": "GLM-4.7", 
"modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 12800, - "output": 4096 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-01-06", + "last_updated": "2026-01-06", + "cost": { + "input": 0.6, + "output": 2.2 }, - "attachment": true, - "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", "type": "chat" }, { - "id": "z-ai/glm-5", - "name": "Z-Ai/GLM 5", - "display_name": "Z-Ai/GLM 5", + "id": "zai-org/glm-5-maas", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -151520,8 +156017,8 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 202752, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -151541,70 +156038,87 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "cost": { + "input": 1, + "output": 3.2, + "cache_read": 0.1 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp-thinking", - "name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp-Thinking", + "id": "deepseek-ai/deepseek-v3.1-maas", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 163840, + "output": 32768 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, 
"default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "open_weights": true, + "release_date": "2025-08-28", + "last_updated": "2025-08-28", + "cost": { + "input": 0.6, + "output": 1.7 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek/DeepSeek-V3.1-Terminus", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus", + "id": "deepseek-ai/deepseek-v3.2-maas", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-12-17", + "last_updated": "2026-04-04", + "cost": { + "input": 0.56, + "output": 1.68, + "cache_read": 0.056 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus-thinking", - "name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", - "display_name": "DeepSeek/DeepSeek-V3.1-Terminus-Thinking", + "id": "qwen/qwen3-235b-a22b-instruct-2507-maas", + "name": "Qwen3 235B A22B Instruct", + "display_name": "Qwen3 235B A22B Instruct", "modalities": { "input": [ "text" @@ -151614,25 +156128,29 @@ ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 262144, + "output": 16384 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": true, + "release_date": "2025-08-13", + "last_updated": "2025-08-13", + "cost": { + "input": 0.22, + "output": 0.88 + }, "type": "chat" }, { - "id": 
"deepseek/deepseek-v3.2-251201", - "name": "Deepseek/DeepSeek-V3.2", - "display_name": "Deepseek/DeepSeek-V3.2", + "id": "meta/llama-3.3-70b-instruct-maas", + "name": "Llama 3.3 70B Instruct", + "display_name": "Llama 3.3 70B Instruct", "modalities": { "input": [ "text" @@ -151643,254 +156161,313 @@ }, "limit": { "context": 128000, - "output": 32000 + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.72, + "output": 0.72 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2-exp", - "name": "DeepSeek/DeepSeek-V3.2-Exp", - "display_name": "DeepSeek/DeepSeek-V3.2-Exp", + "id": "meta/llama-4-maverick-17b-128e-instruct-maas", + "name": "Llama 4 Maverick 17B 128E Instruct", + "display_name": "Llama 4 Maverick 17B 128E Instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 524288, + "output": 8192 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-29", + "last_updated": "2025-04-29", + "cost": { + "input": 0.35, + "output": 1.15 + }, + "type": "chat" + } + ] + }, + "nano-gpt": { + "id": "nano-gpt", + "name": "NanoGPT", + "display_name": "NanoGPT", + "api": "https://nano-gpt.com/api/v1", + "doc": "https://docs.nano-gpt.com", + "models": [ + { + "id": "step-3", + "name": "Step-3", + "display_name": "Step-3", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65536, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + 
"supported": false + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-07-31", + "last_updated": "2025-07-31", + "cost": { + "input": 0.2499, + "output": 0.6494 + }, "type": "chat" }, { - "id": "deepseek/deepseek-math-v2", - "name": "Deepseek/Deepseek-Math-V2", - "display_name": "Deepseek/Deepseek-Math-V2", + "id": "qwen3.5-35b-a3b:thinking", + "name": "Qwen3.5 35B A3B Thinking", + "display_name": "Qwen3.5 35B A3B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 160000, - "output": 160000 + "context": 260096, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-04", - "last_updated": "2025-12-04", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 0.225, + "output": 1.8 + }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "Xiaomi/Mimo-V2-Flash", - "display_name": "Xiaomi/Mimo-V2-Flash", + "id": "glm-4.1v-thinking-flashx", + "name": "GLM 4.1V Thinking FlashX", + "display_name": "GLM 4.1V Thinking FlashX", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 64000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-16", - "last_updated": "2026-02-04", + "attachment": true, + "open_weights": false, + 
"release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "ernie-x1.1-preview", + "name": "ERNIE X1.1", + "display_name": "ERNIE X1.1", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 64000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-07", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-0905", - "name": "Kimi K2 0905", - "display_name": "Kimi K2 0905", + "id": "qwen25-vl-72b-instruct", + "name": "Qwen25 VL 72b", + "display_name": "Qwen25 VL 72b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 100000 + "context": 32000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-09-08", + "release_date": "2025-05-10", + "last_updated": "2025-05-10", + "cost": { + "input": 0.69989, + "output": 0.69989 + }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Moonshotai/Kimi-K2.5", - "display_name": "Moonshotai/Kimi-K2.5", + "id": 
"gemini-2.0-pro-exp-02-05", + "name": "Gemini 2.0 Pro 0205", + "display_name": "Gemini 2.0 Pro 0205", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 2097152, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", + "cost": { + "input": 1.989, + "output": 7.956 + }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-non-reasoning", - "name": "X-Ai/Grok 4.1 Fast Non Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Non Reasoning", + "id": "doubao-seed-2-0-lite-260215", + "name": "Doubao Seed 2.0 Lite", + "display_name": "Doubao Seed 2.0 Lite", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 256000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "cost": { + "input": 0.1462, + "output": 0.8738 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast-non-reasoning", - "name": "X-Ai/Grok-4-Fast-Non-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Non-Reasoning", + "id": "Qwen3.5-27B-Writer-V2-Derestricted", + "name": "Qwen3.5 27B 
Writer V2 Derestricted", + "display_name": "Qwen3.5 27B Writer V2 Derestricted", "modalities": { "input": [ "text", "image", - "audio", "video" ], "output": [ @@ -151898,92 +156475,136 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast-reasoning", - "name": "X-Ai/Grok 4.1 Fast Reasoning", - "display_name": "X-Ai/Grok 4.1 Fast Reasoning", + "id": "claude-opus-4-thinking:8192", + "name": "Claude 4 Opus Thinking (8K)", + "display_name": "Claude 4 Opus Thinking (8K)", "modalities": { "input": [ "text", "image", - "audio", - "video" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 20000000, - "output": 2000000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast-reasoning", - "name": "X-Ai/Grok-4-Fast-Reasoning", - "display_name": "X-Ai/Grok-4-Fast-Reasoning", + "id": "qwen3-vl-235b-a22b-thinking", + "name": "Qwen3 VL 235B A22B Thinking", + "display_name": "Qwen3 VL 235B A22B Thinking", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-12-18", - "last_updated": "2025-12-18", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.5, + "output": 6 + }, "type": "chat" }, { - "id": "x-ai/grok-4.1-fast", - "name": "x-AI/Grok-4.1-Fast", - "display_name": "x-AI/Grok-4.1-Fast", + "id": "glm-4-air-0111", + "name": "GLM 4 Air 0111", + "display_name": "GLM 4 Air 0111", "modalities": { "input": [ "text" @@ -151993,145 +156614,194 @@ ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2025-01-11", + "last_updated": "2025-01-11", + "cost": { + "input": 0.1394, + "output": 0.1394 + }, 
"type": "chat" }, { - "id": "x-ai/grok-code-fast-1", - "name": "x-AI/Grok-Code-Fast 1", - "display_name": "x-AI/Grok-Code-Fast 1", + "id": "Qwen3.5-27B-Queen-Derestricted", + "name": "Qwen3.5 27B Queen Derestricted", + "display_name": "Qwen3.5 27B Queen Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 10000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-02", - "last_updated": "2025-09-02", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "x-ai/grok-4-fast", - "name": "x-AI/Grok-4-Fast", - "display_name": "x-AI/Grok-4-Fast", + "id": "gemini-2.5-pro-preview-03-25", + "name": "Gemini 2.5 Pro Preview 0325", + "display_name": "Gemini 2.5 Pro Preview 0325", "modalities": { "input": [ "text", - "image", - "audio", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2025-09-20", - "last_updated": 
"2025-09-20", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 2.5, + "output": 10 + }, "type": "chat" }, { - "id": "stepfun-ai/gelab-zero-4b-preview", - "name": "Stepfun-Ai/Gelab Zero 4b Preview", - "display_name": "Stepfun-Ai/Gelab Zero 4b Preview", + "id": "brave-research", + "name": "Brave (Research)", + "display_name": "Brave (Research)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", + "cost": { + "input": 5, + "output": 5 + }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "Stepfun/Step-3.5 Flash", - "display_name": "Stepfun/Step-3.5 Flash", + "id": "qwen-plus", + "name": "Qwen Plus", + "display_name": "Qwen Plus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 4096 + "context": 995904, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2026-02-02", - "last_updated": "2026-02-02", + "release_date": "2024-01-25", + "last_updated": "2024-01-25", + "cost": { + "input": 0.3995, + "output": 1.2002 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-lite", - "name": "Meituan/Longcat-Flash-Lite", - "display_name": "Meituan/Longcat-Flash-Lite", + "id": 
"doubao-seed-2-0-mini-260215", + "name": "Doubao Seed 2.0 Mini", + "display_name": "Doubao Seed 2.0 Mini", "modalities": { "input": [ "text" @@ -152142,150 +156812,133 @@ }, "limit": { "context": 256000, - "output": 320000 + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-06", - "last_updated": "2026-02-06", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "cost": { + "input": 0.0493, + "output": 0.4845 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "Meituan/Longcat-Flash-Chat", - "display_name": "Meituan/Longcat-Flash-Chat", + "id": "Qwen3.5-27B-BlueStar-v3-Derestricted-Lite", + "name": "Qwen3.5 27B BlueStar v3 Derestricted Lite", + "display_name": "Qwen3.5 27B BlueStar v3 Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-11-05", - "last_updated": "2025-11-05", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "OpenAI/GPT-5.2", - "display_name": "OpenAI/GPT-5.2", + "id": "deepseek-v3-0324", + "name": "DeepSeek Chat 0324", + "display_name": "DeepSeek Chat 0324", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 
128000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-03-24", + "last_updated": "2025-03-24", + "cost": { + "input": 0.25, + "output": 0.7 + }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "OpenAI/GPT-5", - "display_name": "OpenAI/GPT-5", + "id": "Gemma-4-31B-Musica-v1", + "name": "Gemma 4 31B Musica v1", + "display_name": "Gemma 4 31B Musica v1", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-19", - "last_updated": "2025-09-19", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.1", - "name": "Minimax/Minimax-M2.1", - "display_name": "Minimax/Minimax-M2.1", + "id": "mirothinker-1-7-deepresearch-mini", + "name": 
"MiroThinker 1.7 Deep Research Mini", + "display_name": "MiroThinker 1.7 Deep Research Mini", "modalities": { "input": [ "text" @@ -152295,30 +156948,28 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", + "cost": { + "input": 1.25, + "output": 10 + }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "Minimax/Minimax-M2", - "display_name": "Minimax/Minimax-M2", + "id": "Baichuan4-Turbo", + "name": "Baichuan 4 Turbo", + "display_name": "Baichuan 4 Turbo", "modalities": { "input": [ "text" @@ -152328,30 +156979,27 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-28", - "last_updated": "2025-10-28", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", + "cost": { + "input": 2.42, + "output": 2.42 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "Minimax/Minimax-M2.5", - "display_name": "Minimax/Minimax-M2.5", + "id": "doubao-seed-1-6-flash-250615", + "name": "Doubao Seed 1.6 Flash", + "display_name": "Doubao Seed 1.6 Flash", "modalities": { "input": [ "text" @@ -152361,72 +157009,58 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 256000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - 
"default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", + "cost": { + "input": 0.0374, + "output": 0.374 + }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "Minimax/Minimax-M2.5 Highspeed", - "display_name": "Minimax/Minimax-M2.5 Highspeed", + "id": "kimi-k2-instruct-fast", + "name": "Kimi K2 0711 Fast", + "display_name": "Kimi K2 0711 Fast", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-14", - "last_updated": "2026-02-14", + "release_date": "2025-07-15", + "last_updated": "2025-07-15", + "cost": { + "input": 0.1, + "output": 2 + }, "type": "chat" - } - ] - }, - "morph": { - "id": "morph", - "name": "Morph", - "display_name": "Morph", - "api": "https://api.morphllm.com/v1", - "doc": "https://docs.morphllm.com/api-reference/introduction", - "models": [ + }, { - "id": "morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "glm-4-plus", + "name": "GLM-4 Plus", + "display_name": "GLM-4 Plus", "modalities": { "input": [ "text" @@ -152436,28 +157070,27 @@ ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 128000, + "output": 4096 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": 
"2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.8, - "output": 1.2 + "input": 7.497, + "output": 7.497 }, "type": "chat" }, { - "id": "morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "v0-1.0-md", + "name": "v0 1.0 MD", + "display_name": "v0 1.0 MD", "modalities": { "input": [ "text" @@ -152467,28 +157100,27 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 200000, + "output": 64000 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 0.9, - "output": 1.9 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "auto", - "name": "Auto", - "display_name": "Auto", + "id": "qwen3-coder-30b-a3b-instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ "text" @@ -152498,50 +157130,41 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-06-01", - "last_updated": "2024-06-01", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.85, - "output": 1.55 + "input": 0.1, + "output": 0.4 }, "type": "chat" - } - ] - }, - "xiaomi-token-plan-sgp": { - "id": "xiaomi-token-plan-sgp", - "name": "Xiaomi Token Plan (Singapore)", - "display_name": "Xiaomi Token Plan (Singapore)", - "api": "https://token-plan-sgp.xiaomimimo.com/v1", - "doc": "https://platform.xiaomimimo.com/#/docs", - "models": [ + }, { - "id": "mimo-v2.5-pro", - "name": "MiMo-V2.5-Pro", - "display_name": "MiMo-V2.5-Pro", + "id": "gemini-2.5-flash-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash 
Preview (09/2025) – Thinking", + "display_name": "Gemini 2.5 Flash Preview (09/2025) – Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -152550,65 +157173,71 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "mimo-v2.5-tts", - "name": "MiMo-V2.5-TTS", - "display_name": "MiMo-V2.5-TTS", + "id": "v0-1.5-lg", + "name": "v0 1.5 LG", + "display_name": "v0 1.5 LG", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 64000 }, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 0, - "output": 0 + "input": 15, + "output": 75 }, "type": "chat" }, { - "id": "mimo-v2.5", - "name": "MiMo-V2.5", - "display_name": "MiMo-V2.5", + "id": "qwen3.5-flash:thinking", + "name": "Qwen3.5 Flash Thinking", + "display_name": "Qwen3.5 Flash Thinking", "modalities": { "input": [ "text", 
"image", - "audio", "video" ], "output": [ @@ -152616,11 +157245,10 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 991808, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -152637,21 +157265,19 @@ } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "open_weights": false, + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "mimo-v2-pro", - "name": "MiMo-V2-Pro", - "display_name": "MiMo-V2-Pro", + "id": "jamba-large", + "name": "Jamba Large", + "display_name": "Jamba Large", "modalities": { "input": [ "text" @@ -152661,108 +157287,94 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voiceclone", - "name": "MiMo-V2.5-TTS-VoiceClone", - "display_name": "MiMo-V2.5-TTS-VoiceClone", + "id": "kimi-thinking-preview", + "name": "Kimi Thinking Preview", + "display_name": "Kimi Thinking Preview", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + 
"context": 128000, + "output": 16384 }, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-07", + "last_updated": "2025-05-07", "cost": { - "input": 0, - "output": 0 + "input": 31.46, + "output": 31.46 }, "type": "chat" }, { - "id": "mimo-v2.5-tts-voicedesign", - "name": "MiMo-V2.5-TTS-VoiceDesign", - "display_name": "MiMo-V2.5-TTS-VoiceDesign", + "id": "gemini-2.0-flash-thinking-exp-01-21", + "name": "Gemini 2.0 Flash Thinking 0121", + "display_name": "Gemini 2.0 Flash Thinking 0121", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, + "context": 1000000, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-01-21", + "last_updated": "2025-01-21", "cost": { - "input": 0, - "output": 0 + "input": 0.306, + "output": 1.003 }, "type": "chat" }, { - "id": "mimo-v2-omni", - "name": "MiMo-V2-Omni", - "display_name": "MiMo-V2-Omni", + "id": "claude-opus-4-1-thinking:1024", + "name": "Claude 4.1 Opus Thinking (1K)", + "display_name": "Claude 4.1 Opus Thinking (1K)", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -152770,10 +157382,9 @@ ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -152782,228 +157393,245 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, 
"visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "mimo-v2-tts", - "name": "MiMo-V2-TTS", - "display_name": "MiMo-V2-TTS", + "id": "Qwen3.5-27B-NaNovel-Derestricted-Lite", + "name": "Qwen3.5 27B NaNovel Derestricted Lite", + "display_name": "Qwen3.5 27B NaNovel Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0, - "output": 0 + "input": 0.306, + "output": 0.306 }, "type": "chat" - } - ] - }, - "fastrouter": { - "id": "fastrouter", - "name": "FastRouter", - "display_name": "FastRouter", - "api": "https://go.fastrouter.ai/api/v1", - "doc": "https://fastrouter.ai/models", - "models": [ + }, + { + "id": "doubao-seed-1-6-250615", + "name": "Doubao Seed 1.6", + "display_name": "Doubao Seed 1.6", + "modalities": { + "input": [ + "text" + ], + "output": [ 
+ "text" + ] + }, + "limit": { + "context": 256000, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-06-15", + "last_updated": "2025-06-15", + "cost": { + "input": 0.204, + "output": 0.51 + }, + "type": "chat" + }, { - "id": "z-ai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "ernie-5.0-thinking-preview", + "name": "Ernie 5.0 Thinking Preview", + "display_name": "Ernie 5.0 Thinking Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "release_date": "2025-11-18", + "last_updated": "2025-11-18", "cost": { - "input": 0.95, - "output": 3.15 + "input": 1.1, + "output": 2 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "gemini-2.5-flash-preview-05-20:thinking", + "name": "Gemini 2.5 Flash 0520 Thinking", + "display_name": "Gemini 2.5 Flash 0520 Thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + 
"default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 3.5 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "Qwen3.5-27B-Omega-Evolution-v2.2-Derestricted", + "name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted", + "display_name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "qwen/qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "azure-o1", + "name": "Azure o1", + "display_name": "Azure o1", "modalities": { "input": [ "text" @@ -153013,61 +157641,65 @@ ] }, "limit": { - "context": 262144, - "output": 66536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 0.3, - "output": 1.2 + "input": 14.994, + "output": 59.993 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "qwen3.7-plus", + "name": "Qwen3.7 Plus", + "display_name": "Qwen3.7 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 991808, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2025-07-11", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 0.55, - "output": 2.2 + "input": 0.4, + "output": 1.6, + "cache_read": 0.04 }, 
"type": "chat" }, { - "id": "x-ai/grok-4", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "glm-4-airx", + "name": "GLM-4 AirX", + "display_name": "GLM-4 AirX", "modalities": { "input": [ "text" @@ -153077,37 +157709,27 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.75, - "cache_write": 15 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-r1-distill-llama-70b", - "name": "DeepSeek R1 Distill Llama 70B", - "display_name": "DeepSeek R1 Distill Llama 70B", + "id": "step-r1-v-mini", + "name": "Step R1 V Mini", + "display_name": "Step R1 V Mini", "modalities": { "input": [ "text" @@ -153117,51 +157739,41 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-01-23", - "last_updated": "2025-01-23", + "open_weights": false, + "release_date": "2025-04-08", + "last_updated": "2025-04-08", "cost": { - "input": 0.03, - "output": 0.14 + "input": 2.5, + "output": 11 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", + "id": "gemini-2.5-pro", "name": "Gemini 2.5 Pro", "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] 
}, "limit": { - "context": 1048576, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -153187,20 +157799,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.31 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "claude-haiku-4-5-20251001-thinking", + "name": "Claude Haiku 4.5 Thinking", + "display_name": "Claude Haiku 4.5 Thinking", "modalities": { "input": [ "text", @@ -153212,10 +157822,9 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -153227,217 +157836,166 @@ "default_enabled": true, "mode": "budget", "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, + "min": 1024, "unit": "tokens" }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.0375 + "input": 1, + "output": 5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "jamba-mini-1.6", + "name": "Jamba Mini 1.6", + "display_name": "Jamba Mini 1.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-03-01", + "last_updated": "2025-03-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "claude-haiku-4-5-20251001", + "name": "Claude Haiku 4.5", + "display_name": "Claude Haiku 4.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, 
"extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1, + "output": 5 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "claude-3-5-haiku-20241022", + "name": "Claude 3.5 Haiku", + "display_name": "Claude 3.5 Haiku", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10-01", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + 
"release_date": "2024-10-22", + "last_updated": "2024-10-22", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.8, + "output": 4 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "claude-sonnet-4-thinking:32768", + "name": "Claude 4 Sonnet Thinking (32K)", + "display_name": "Claude 4 Sonnet Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -153445,167 +158003,127 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "hermes-low", + "name": "Hermes Low", + "display_name": "Hermes Low", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, + "context": 1048576, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", - "cost": { - "input": 0.05, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 - }, - "type": "chat" - } - ] - }, - "siliconflow-com": { - "id": "siliconflow-com", - "name": "SiliconFlow", - "display_name": "SiliconFlow", - "api": "https://api.siliconflow.com/v1", - "doc": "https://cloud.siliconflow.com/models", - "models": [ - { - "id": "THUDM/GLM-Z1-32B-0414", - "name": "THUDM/GLM-Z1-32B-0414", - "display_name": "THUDM/GLM-Z1-32B-0414", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131000, - 
"output": 131000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "THUDM/GLM-Z1-9B-0414", - "name": "THUDM/GLM-Z1-9B-0414", - "display_name": "THUDM/GLM-Z1-9B-0414", + "id": "claude-sonnet-4-thinking", + "name": "Claude 4 Sonnet Thinking", + "display_name": "Claude 4 Sonnet Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { - "input": 0.086, - "output": 0.086 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "THUDM/GLM-4-32B-0414", - "name": "THUDM/GLM-4-32B-0414", - "display_name": "THUDM/GLM-4-32B-0414", + "id": "qwen3.7-max", + "name": "Qwen3.7 Max", + "display_name": "Qwen3.7 Max", "modalities": { "input": [ "text" @@ -153615,28 +158133,33 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 1000000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.27, - "output": 0.27 + "input": 2.5, + "output": 7.5, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "THUDM/GLM-4-9B-0414", - "name": "THUDM/GLM-4-9B-0414", - "display_name": "THUDM/GLM-4-9B-0414", + "id": "yi-medium-200k", + "name": "Yi Medium 200k", + "display_name": "Yi Medium 200k", "modalities": { "input": [ "text" @@ -153646,162 +158169,180 @@ ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 200000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-18", - "last_updated": "2025-11-25", + "release_date": "2024-03-01", + "last_updated": "2024-03-01", "cost": { - "input": 0.086, - "output": 0.086 + "input": 2.499, + "output": 2.499 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMaxAI/MiniMax-M2.5", - "display_name": "MiniMaxAI/MiniMax-M2.5", + "id": 
"Qwen3.5-27B-BlueStar-v2-Derestricted-Lite", + "name": "Qwen3.5 27B BlueStar v2 Derestricted Lite", + "display_name": "Qwen3.5 27B BlueStar v2 Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-15", - "last_updated": "2026-02-15", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMaxAI/MiniMax-M2.1", - "display_name": "MiniMaxAI/MiniMax-M2.1", + "id": "Gemma-4-31B-Claude-4.6-Opus-Reasoning-Distilled", + "name": "Gemma 4 31B Claude 4.6 Opus Reasoning Distilled", + "display_name": "Gemma 4 31B Claude 4.6 Opus Reasoning Distilled", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 197000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.306, + "output": 0.306, + "cache_read": 0.0306 }, 
"type": "chat" }, { - "id": "inclusionAI/Ling-mini-2.0", - "name": "inclusionAI/Ling-mini-2.0", - "display_name": "inclusionAI/Ling-mini-2.0", + "id": "doubao-1-5-thinking-vision-pro-250428", + "name": "Doubao 1.5 Thinking Vision Pro", + "display_name": "Doubao 1.5 Thinking Vision Pro", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-11-25", + "release_date": "2025-05-15", + "last_updated": "2025-05-15", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.55, + "output": 1.43 }, "type": "chat" }, { - "id": "inclusionAI/Ling-flash-2.0", - "name": "inclusionAI/Ling-flash-2.0", - "display_name": "inclusionAI/Ling-flash-2.0", + "id": "Qwen3.5-27B-BlueStar-Derestricted-Lite", + "name": "Qwen3.5 27B BlueStar Derestricted Lite", + "display_name": "Qwen3.5 27B BlueStar Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": 
"inclusionAI/Ring-flash-2.0", - "name": "inclusionAI/Ring-flash-2.0", - "display_name": "inclusionAI/Ring-flash-2.0", + "id": "Qwen2.5-32B-EVA-v0.2", + "name": "Qwen 2.5 32b EVA", + "display_name": "Qwen 2.5 32b EVA", "modalities": { "input": [ "text" @@ -153811,48 +158352,41 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 24576, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2024-09-01", + "last_updated": "2024-09-01", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "zai-org/GLM-4.7", - "display_name": "zai-org/GLM-4.7", + "id": "gemini-2.5-flash", + "name": "Gemini 2.5 Flash", + "display_name": "Gemini 2.5 Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -153860,102 +158394,101 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.3, + "output": 2.5 
}, "type": "chat" }, { - "id": "zai-org/GLM-4.5-Air", - "name": "zai-org/GLM-4.5-Air", - "display_name": "zai-org/GLM-4.5-Air", + "id": "qwen-long", + "name": "Qwen Long 10M", + "display_name": "Qwen Long 10M", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 10000000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 0.14, - "output": 0.86 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "zai-org/GLM-5", - "display_name": "zai-org/GLM-5", + "id": "Gemma-4-31B-DarkIdol", + "name": "Gemma 4 31B DarkIdol", + "display_name": "Gemma 4 31B DarkIdol", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 1, - "output": 3.2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "zai-org/GLM-5.1", - "display_name": "zai-org/GLM-5.1", + "id": "step-2-16k-exp", + "name": "Step-2 16k Exp", + "display_name": "Step-2 16k Exp", "modalities": { 
"input": [ "text" @@ -153965,88 +158498,86 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 16000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-04-08", + "open_weights": false, + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 1.4, - "output": 4.4, - "cache_write": 0 + "input": 7.004, + "output": 19.992 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5V", - "name": "zai-org/GLM-4.5V", - "display_name": "zai-org/GLM-4.5V", + "id": "Qwen3.5-27B-Marvin-V2-Derestricted-Lite", + "name": "Qwen3.5 27B Marvin V2 Derestricted Lite", + "display_name": "Qwen3.5 27B Marvin V2 Derestricted Lite", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.14, - "output": 0.86 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "zai-org/GLM-5V-Turbo", - "name": "zai-org/GLM-5V-Turbo", - "display_name": "zai-org/GLM-5V-Turbo", + "id": "Qwen3.5-27B-NaNovel-Derestricted", + 
"name": "Qwen3.5 27B NaNovel Derestricted", + "display_name": "Qwen3.5 27B NaNovel Derestricted", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -154064,19 +158595,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 1.2, - "output": 4, - "cache_write": 0 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "zai-org/GLM-4.5", - "name": "zai-org/GLM-4.5", - "display_name": "zai-org/GLM-4.5", + "id": "ernie-4.5-8k-preview", + "name": "Ernie 4.5 8k Preview", + "display_name": "Ernie 4.5 8k Preview", "modalities": { "input": [ "text" @@ -154086,142 +158616,139 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 8000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 0.4, - "output": 2 + "input": 0.66, + "output": 2.6 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6V", - "name": "zai-org/GLM-4.6V", - "display_name": "zai-org/GLM-4.6V", + "id": "gemini-2.0-flash-exp-image-generation", + "name": "Gemini Text + Image", + "display_name": "Gemini Text + Image", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 32767, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - 
"attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-12-07", - "last_updated": "2025-12-07", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "zai-org/GLM-4.6", - "display_name": "zai-org/GLM-4.6", + "id": "gemini-2.5-flash-lite-preview-09-2025", + "name": "Gemini 2.5 Flash Lite Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.5, - "output": 1.9 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "moonshotai/Kimi-K2.6", - "display_name": "moonshotai/Kimi-K2.6", + "id": "deepseek-reasoner-cheaper", + "name": "Deepseek R1 Cheaper", + "display_name": "Deepseek R1 Cheaper", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct-0905", - "name": "moonshotai/Kimi-K2-Instruct-0905", - "display_name": "moonshotai/Kimi-K2-Instruct-0905", + "id": "venice-uncensored", + "name": "Venice Uncensored", + "display_name": "Venice Uncensored", "modalities": { "input": [ "text" @@ -154231,28 +158758,27 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-08", - "last_updated": "2025-11-25", + "release_date": "2025-02-24", + "last_updated": "2025-02-24", "cost": { "input": 0.4, - "output": 2 + "output": 0.4 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "moonshotai/Kimi-K2.5", - "display_name": "moonshotai/Kimi-K2.5", + "id": "gemini-2.0-flash-001", + "name": "Gemini 2.0 Flash", + "display_name": "Gemini 2.0 Flash", "modalities": { "input": [ "text", @@ -154263,276 +158789,287 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 8192 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": 
true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": true, + "open_weights": false, + "release_date": "2024-12-11", + "last_updated": "2024-12-11", "cost": { - "input": 0.45, - "output": 2.25 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Instruct", - "name": "moonshotai/Kimi-K2-Instruct", - "display_name": "moonshotai/Kimi-K2-Instruct", + "id": "gemma-4-31B-Larkspur-v0.5", + "name": "Gemma 4 31B Larkspur v0.5", + "display_name": "Gemma 4 31B Larkspur v0.5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-13", - "last_updated": "2025-11-25", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", "cost": { - "input": 0.58, - "output": 2.29 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "moonshotai/Kimi-K2-Thinking", - "display_name": "moonshotai/Kimi-K2-Thinking", + "id": "claude-opus-4-1-20250805", + "name": "Claude 4.1 Opus", + "display_name": "Claude 4.1 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual 
thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-07", - "last_updated": "2025-11-25", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.55, - "output": 2.5 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "display_name": "meta-llama/Meta-Llama-3.1-8B-Instruct", + "id": "holo3-35b-a3b", + "name": "Holo3-35B-A3B", + "display_name": "Holo3-35B-A3B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 65536, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-23", - "last_updated": "2025-11-25", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.25, + "output": 1.8 }, "type": "chat" }, { - "id": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "name": "ByteDance-Seed/Seed-OSS-36B-Instruct", - "display_name": "ByteDance-Seed/Seed-OSS-36B-Instruct", + "id": "qwen3.5-omni-plus", + "name": "Qwen3.5 Omni Plus", + "display_name": "Qwen3.5 Omni Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 983616, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": 
true, "open_weights": false, - "release_date": "2025-09-04", - "last_updated": "2025-11-25", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.21, - "output": 0.57 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "baidu/ERNIE-4.5-300B-A47B", - "name": "baidu/ERNIE-4.5-300B-A47B", - "display_name": "baidu/ERNIE-4.5-300B-A47B", + "id": "Gemma-4-31B-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-02", - "last_updated": "2025-11-25", + "release_date": "2026-04-09", + "last_updated": "2026-04-09", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "deepseek-ai/DeepSeek-V3.1", - "display_name": "deepseek-ai/DeepSeek-V3.1", + "id": "Qwen3.5-27B-Derestricted", + "name": "Qwen3.5 27B Derestricted", + "display_name": "Qwen3.5 27B Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-25", - "last_updated": "2025-11-25", + "release_date": "2026-03-17", + 
"last_updated": "2026-03-17", "cost": { - "input": 0.27, - "output": 1 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "sonar-reasoning-pro", + "name": "Perplexity Reasoning Pro", + "display_name": "Perplexity Reasoning Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 4000, - "output": 4000 + "context": 127000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2024-12-13", - "last_updated": "2025-11-25", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.15, - "output": 0.15 + "input": 2.006, + "output": 7.9985 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "deepseek-ai/DeepSeek-V3.1-Terminus", - "display_name": "deepseek-ai/DeepSeek-V3.1-Terminus", + "id": "venice-uncensored:web", + "name": "Venice Uncensored Web", + "display_name": "Venice Uncensored Web", "modalities": { "input": [ "text" @@ -154542,29 +159079,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 80000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-29", - "last_updated": "2025-11-25", + "release_date": "2024-05-01", + "last_updated": "2024-05-01", "cost": { - "input": 0.27, - "output": 1 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "deepseek-ai/DeepSeek-V3.2", - "display_name": "deepseek-ai/DeepSeek-V3.2", + "id": "doubao-1.5-pro-32k", + "name": "Doubao 1.5 Pro 32k", 
+ "display_name": "Doubao 1.5 Pro 32k", "modalities": { "input": [ "text" @@ -154574,34 +159109,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 32000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-03", - "last_updated": "2025-12-03", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", "cost": { - "input": 0.27, - "output": 0.42 + "input": 0.1343, + "output": 0.3349 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + "display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" @@ -154611,72 +159139,61 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.2, + "output": 0.5 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "deepseek-ai/DeepSeek-R1", - "display_name": "deepseek-ai/DeepSeek-R1", + "id": "ernie-5.1:thinking", + "name": "ERNIE 5.1 Thinking", + "display_name": "ERNIE 5.1 Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 119000, + "output": 64000 }, - "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-11-25", + "release_date": "2026-05-10", + "last_updated": "2026-05-10", "cost": { - "input": 0.5, - "output": 2.18 + "input": 0.75, + "output": 3, + "cache_read": 0.75 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "mirothinker-1-7-deepresearch", + "name": "MiroThinker 1.7 Deep Research", + "display_name": "MiroThinker 1.7 Deep Research", "modalities": { "input": [ "text" @@ -154686,61 +159203,61 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-01-20", - "last_updated": "2025-11-25", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.1, - "output": 0.1 + "input": 4, + "output": 25 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "deepseek-ai/DeepSeek-V3.2-Exp", - "display_name": "deepseek-ai/DeepSeek-V3.2-Exp", + "id": "hermes-high", + "name": "Hermes High", + "display_name": "Hermes High", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "release_date": "2025-10-10", - "last_updated": "2025-11-25", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.27, - "output": 0.41 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3", - "name": "deepseek-ai/DeepSeek-V3", - "display_name": "deepseek-ai/DeepSeek-V3", + "id": "jamba-large-1.6", + "name": "Jamba Large 1.6", + "display_name": "Jamba Large 1.6", "modalities": { "input": [ "text" @@ -154750,28 +159267,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-26", - "last_updated": "2025-11-25", + "release_date": "2025-03-12", + "last_updated": "2025-03-12", "cost": { - "input": 0.25, - "output": 1 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "glm-4-long", + "name": "GLM-4 Long", + "display_name": "GLM-4 Long", "modalities": { "input": [ "text" @@ -154782,54 +159298,40 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.028 + "input": 0.2006, + "output": 0.2006 }, "type": 
"chat" }, { - "id": "deepseek-ai/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "claude-opus-4-thinking:32768", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -154838,62 +159340,92 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "stepfun-ai/Step-3.5-Flash", - "name": "stepfun-ai/Step-3.5-Flash", - "display_name": "stepfun-ai/Step-3.5-Flash", + "id": "claude-sonnet-4-thinking:8192", + "name": "Claude 4 Sonnet Thinking (8K)", + "display_name": "Claude 4 Sonnet Thinking (8K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.3 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "nex-agi/DeepSeek-V3.1-Nex-N1", - "name": "nex-agi/DeepSeek-V3.1-Nex-N1", - "display_name": "nex-agi/DeepSeek-V3.1-Nex-N1", + "id": "azure-o3-mini", + "name": "Azure o3-mini", + "display_name": "Azure o3-mini", "modalities": { "input": [ "text" @@ -154903,106 +159435,117 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-01-01", - "last_updated": "2025-11-25", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 0.5, - "output": 2 + "input": 1.088, + "output": 4.3996 }, "type": "chat" }, { - "id": "tencent/Hunyuan-A13B-Instruct", - "name": "tencent/Hunyuan-A13B-Instruct", - "display_name": "tencent/Hunyuan-A13B-Instruct", + "id": "qvq-max", + "name": "Qwen: QvQ Max", + "display_name": "Qwen: QvQ Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-30", - "last_updated": "2025-11-25", + "release_date": "2025-03-28", + "last_updated": "2025-03-28", "cost": { - "input": 0.14, - "output": 0.57 + "input": 1.4, + "output": 5.3 }, "type": "chat" }, { - "id": "tencent/Hunyuan-MT-7B", - "name": "tencent/Hunyuan-MT-7B", - "display_name": "tencent/Hunyuan-MT-7B", + "id": 
"Qwen3.5-27B-BlueStar-v2-Derestricted", + "name": "Qwen3.5 27B BlueStar v2 Derestricted", + "display_name": "Qwen3.5 27B BlueStar v2 Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 33000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 0, - "output": 0 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "name": "Qwen/Qwen3-VL-235B-A22B-Thinking", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Thinking", + "id": "Qwen3.5-27B-Vivid-Durian", + "name": "Qwen3.5 27B Vivid Durian", + "display_name": "Qwen3.5 27B Vivid Durian", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -155020,18 +159563,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.45, - "output": 3.5 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "id": 
"jamba-large-1.7", + "name": "Jamba Large 1.7", + "display_name": "Jamba Large 1.7", "modalities": { "input": [ "text" @@ -155041,149 +159584,144 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.25, - "output": 1 + "input": 1.989, + "output": 7.99 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Instruct", - "name": "Qwen/Qwen3-VL-8B-Instruct", - "display_name": "Qwen/Qwen3-VL-8B-Instruct", + "id": "Baichuan-M2", + "name": "Baichuan M2 32B Medical", + "display_name": "Baichuan M2 32B Medical", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 0.18, - "output": 0.68 + "input": 15.73, + "output": 15.73 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-8B-Thinking", - "name": "Qwen/Qwen3-VL-8B-Thinking", - "display_name": "Qwen/Qwen3-VL-8B-Thinking", + "id": "Magistral-Small-2506", + "name": "Magistral Small 2506", + "display_name": "Magistral Small 2506", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { 
- "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-15", - "last_updated": "2025-11-25", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.18, - "output": 2 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Captioner", + "id": "deepseek-r1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.4, + "output": 1.7 }, "type": "chat" - }, - { - "id": "Qwen/QwQ-32B", - "name": "Qwen/QwQ-32B", - "display_name": "Qwen/QwQ-32B", + }, + { + "id": "Qwen3.5-27B-earica-Derestricted-Lite", + "name": "Qwen3.5 27B earica Derestricted Lite", + "display_name": "Qwen3.5 27B earica Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { 
"supported": true, "default": true @@ -155199,20 +159737,20 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-03-06", - "last_updated": "2025-11-25", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.15, - "output": 0.58 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", + "id": "doubao-seed-2-0-pro-260215", + "name": "Doubao Seed 2.0 Pro", + "display_name": "Doubao Seed 2.0 Pro", "modalities": { "input": [ "text" @@ -155222,150 +159760,166 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 256000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-02-14", + "last_updated": "2026-02-14", "cost": { - "input": 0.59, - "output": 0.59 + "input": 0.782, + "output": 3.876 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Instruct", + "id": "step-2-mini", + "name": "Step-2 Mini", + "display_name": "Step-2 Mini", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2024-07-05", + "last_updated": "2024-07-05", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.2006, + "output": 0.408 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - 
"name": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Instruct-2507", + "id": "gemini-exp-1206", + "name": "Gemini 2.0 Pro 1206", + "display_name": "Gemini 2.0 Pro 1206", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 2097152, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-07-30", - "last_updated": "2025-11-25", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.09, - "output": 0.3 + "input": 1.258, + "output": 4.998 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B", - "name": "Qwen/Qwen3-235B-A22B", - "display_name": "Qwen/Qwen3-235B-A22B", + "id": "claude-opus-4-5-20251101:thinking", + "name": "Claude 4.5 Opus Thinking", + "display_name": "Claude 4.5 Opus Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.35, - "output": 1.42 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "Qwen/Qwen3-14B", - "name": "Qwen/Qwen3-14B", - "display_name": "Qwen/Qwen3-14B", + "id": "Qwen3.5-27B-BlueStar-v3-Derestricted", + "name": "Qwen3.5 27B BlueStar v3 Derestricted", + "display_name": "Qwen3.5 27B BlueStar v3 Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -155378,39 +159932,92 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.07, - "output": 0.28 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Thinking", - "name": "Qwen/Qwen3-VL-32B-Thinking", - "display_name": "Qwen/Qwen3-VL-32B-Thinking", + "id": "claude-opus-4-thinking", + "name": "Claude 4 Opus Thinking", + "display_name": "Claude 4 Opus Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": 
"summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-07-15", + "last_updated": "2025-07-15", + "cost": { + "input": 14.994, + "output": 75.004 + }, + "type": "chat" + }, + { + "id": "qwen3.5-flash", + "name": "Qwen3.5 Flash", + "display_name": "Qwen3.5 Flash", + "modalities": { + "input": [ + "text", + "image", + "video" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 991808, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": true + }, "extra_capabilities": { "reasoning": { "supported": true, @@ -155424,18 +160031,18 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", + "id": "exa-research-pro", + "name": "Exa (Research Pro)", + "display_name": "Exa (Research Pro)", "modalities": { "input": [ "text" @@ -155445,28 +160052,27 @@ ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "cost": { - "input": 0.59, - "output": 0.59 + "input": 2.5, + "output": 2.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-8B", - "name": "Qwen/Qwen3-8B", - "display_name": "Qwen/Qwen3-8B", + "id": 
"jamba-mini", + "name": "Jamba Mini", + "display_name": "Jamba Mini", "modalities": { "input": [ "text" @@ -155476,52 +160082,41 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.06, - "output": 0.06 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "id": "claude-opus-4-1-thinking:32000", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -155530,28 +160125,68 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, + "type": "chat" + }, + { + "id": "KAT-Coder-Air-V1", + "name": "KAT Coder Air V1", + "display_name": "KAT Coder Air V1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": false, "open_weights": false, - "release_date": "2025-07-28", - "last_updated": "2025-11-25", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.1, + "output": 0.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "id": "exa-research", + "name": "Exa (Research)", + "display_name": "Exa (Research)", "modalities": { "input": [ "text" @@ -155561,43 +160196,72 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-01", - "last_updated": "2025-11-25", + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "cost": { - "input": 0.07, - "output": 0.28 + "input": 2.5, + "output": 2.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Omni-30B-A3B-Thinking", + "id": "deepclaude", + "name": "DeepClaude", + "display_name": "DeepClaude", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": 
false, + "release_date": "2025-02-01", + "last_updated": "2025-02-01", + "cost": { + "input": 3, + "output": 15 + }, + "type": "chat" + }, + { + "id": "gemini-2.5-flash-preview-09-2025", + "name": "Gemini 2.5 Flash Preview (09/2025)", + "display_name": "Gemini 2.5 Flash Preview (09/2025)", "modalities": { "input": [ "text", "image", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 66000 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -155606,91 +160270,127 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.1, - "output": 0.4 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "display_name": "Qwen/Qwen3-235B-A22B-Instruct-2507", + "id": "claude-opus-4-5-20251101", + "name": "Claude 4.5 Opus", + "display_name": "Claude 4.5 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + 
"medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-07-23", - "last_updated": "2025-11-25", + "release_date": "2025-11-01", + "last_updated": "2025-11-01", "cost": { - "input": 0.09, - "output": 0.6 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-32B-Instruct", - "name": "Qwen/Qwen3-VL-32B-Instruct", - "display_name": "Qwen/Qwen3-VL-32B-Instruct", + "id": "GLM-4.6-Derestricted-v5", + "name": "GLM 4.6 Derestricted v5", + "display_name": "GLM 4.6 Derestricted v5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-21", - "last_updated": "2025-11-25", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.4, + "output": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "name": "Qwen/Qwen3-Next-80B-A3B-Instruct", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Instruct", + "id": "glm-z1-airx", + "name": "GLM Z1 AirX", + "display_name": "GLM Z1 AirX", "modalities": { "input": [ "text" @@ -155700,59 +160400,81 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": 
"2025-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.14, - "output": 1.4 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-14B-Instruct", - "name": "Qwen/Qwen2.5-14B-Instruct", - "display_name": "Qwen/Qwen2.5-14B-Instruct", + "id": "claude-sonnet-4-thinking:1024", + "name": "Claude 4 Sonnet Thinking (1K)", + "display_name": "Claude 4 Sonnet Thinking (1K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.1, - "output": 0.1 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "name": "Qwen/Qwen3-VL-30B-A3B-Instruct", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Instruct", + "id": "holo3-35b-a3b:thinking", + "name": "Holo3-35B-A3B Thinking", + "display_name": "Holo3-35B-A3B Thinking", "modalities": { "input": [ "text", @@ -155763,28 +160485,28 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 65536, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-10-05", - "last_updated": "2025-11-25", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.29, - "output": 1 + "input": 0.25, + "output": 1.8 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "owl", + "name": "OWL", + "display_name": "OWL", "modalities": { "input": [ "text" @@ -155794,108 +160516,108 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 1048756, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-11-11", - "last_updated": "2025-11-25", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.18, - "output": 0.18 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen/Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-72B-Instruct", + "id": "gemini-2.0-pro-reasoner", + "name": "Gemini 2.0 Pro 
Reasoner", + "display_name": "Gemini 2.0 Pro Reasoner", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 4000 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "release_date": "2025-02-05", + "last_updated": "2025-02-05", "cost": { - "input": 0.59, - "output": 0.59 + "input": 1.292, + "output": 4.998 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen/Qwen2.5-VL-32B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-32B-Instruct", + "id": "Gemma-4-31B-Cognitive-Unshackled", + "name": "Gemma 4 31B Cognitive Unshackled", + "display_name": "Gemma 4 31B Cognitive Unshackled", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-03-24", - "last_updated": "2025-11-25", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.27, - "output": 0.27 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen/Qwen3-32B", - "display_name": "Qwen/Qwen3-32B", + "id": "Qwen3.5-27B-earica-Derestricted", + "name": "Qwen3.5 27B earica Derestricted", + "display_name": "Qwen3.5 27B earica Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, 
"reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -155908,83 +160630,82 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-04-30", - "last_updated": "2025-11-25", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.14, - "output": 0.57 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", + "id": "command-a-plus-05-2026", + "name": "Cohere Command A+ (05/2026)", + "display_name": "Cohere Command A+ (05/2026)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 128000, + "output": 64000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-19", - "last_updated": "2025-11-25", + "release_date": "2026-05-22", + "last_updated": "2026-05-22", "cost": { - "input": 0.18, - "output": 0.18 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-7B-Instruct", - "name": "Qwen/Qwen2.5-VL-7B-Instruct", - "display_name": "Qwen/Qwen2.5-VL-7B-Instruct", + "id": "auto-model-premium", + "name": "Auto model (Premium)", + "display_name": "Auto model (Premium)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 1000000, + "output": 1000000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-01-28", - "last_updated": "2025-11-25", + "release_date": "2024-06-01", + 
"last_updated": "2024-06-01", "cost": { - "input": 0.05, - "output": 0.05 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "name": "Qwen/Qwen3-30B-A3B-Thinking-2507", - "display_name": "Qwen/Qwen3-30B-A3B-Thinking-2507", + "id": "learnlm-1.5-pro-experimental", + "name": "Gemini LearnLM Experimental", + "display_name": "Gemini LearnLM Experimental", "modalities": { "input": [ "text" @@ -155994,84 +160715,57 @@ ] }, "limit": { - "context": 262000, - "output": 131000 + "context": 32767, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-31", - "last_updated": "2025-11-25", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", "cost": { - "input": 0.09, - "output": 0.3 + "input": 3.502, + "output": 10.506 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "name": "Qwen/Qwen3-VL-30B-A3B-Thinking", - "display_name": "Qwen/Qwen3-VL-30B-A3B-Thinking", + "id": "deepseek-r1-sambanova", + "name": "DeepSeek R1 Fast", + "display_name": "DeepSeek R1 Fast", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - 
"release_date": "2025-10-11", - "last_updated": "2025-11-25", + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.29, - "output": 1 + "input": 4.998, + "output": 6.987 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", + "id": "claw-medium", + "name": "Claw Medium", + "display_name": "Claw Medium", "modalities": { "input": [ "text" @@ -156081,103 +160775,112 @@ ] }, "limit": { - "context": 33000, - "output": 4000 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2024-09-18", - "last_updated": "2025-11-25", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.05, - "output": 0.05 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen/Qwen3-Next-80B-A3B-Thinking", + "id": "claude-opus-4-20250514", + "name": "Claude 4 Opus", + "display_name": "Claude 4 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-25", - "last_updated": "2025-11-25", + "release_date": "2025-05-14", + "last_updated": "2025-05-14", "cost": { - "input": 0.14, - "output": 0.57 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "name": "Qwen/Qwen3-VL-235B-A22B-Instruct", - "display_name": "Qwen/Qwen3-VL-235B-A22B-Instruct", + "id": "yi-large", + "name": "Yi Large", + "display_name": "Yi Large", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 32000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-10-04", - "last_updated": "2025-11-25", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.3, - "output": 1.5 + "input": 3.196, + "output": 3.196 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "openai/gpt-oss-120b", - "display_name": "openai/gpt-oss-120b", + "id": "qwen3-max-2026-01-23", + "name": "Qwen3 Max 2026-01-23", + "display_name": "Qwen3 Max 2026-01-23", "modalities": { "input": [ "text" @@ -156187,34 +160890,38 @@ ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - 
"input": 0.05, - "output": 0.45 + "input": 1.2002, + "output": 6.001 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "openai/gpt-oss-20b", - "display_name": "openai/gpt-oss-20b", + "id": "phi-4-mini-instruct", + "name": "Phi 4 Mini", + "display_name": "Phi 4 Mini", "modalities": { "input": [ "text" @@ -156224,459 +160931,513 @@ ] }, "limit": { - "context": 131000, - "output": 8000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-13", - "last_updated": "2025-11-25", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.04, - "output": 0.18 + "input": 0.17, + "output": 0.68 }, "type": "chat" - } - ] - }, - "vercel": { - "id": "vercel", - "name": "Vercel AI Gateway", - "display_name": "Vercel AI Gateway", - "doc": "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway", - "models": [ + }, { - "id": "kwaipilot/kat-coder-pro-v2", - "name": "Kat Coder Pro V2", - "display_name": "Kat Coder Pro V2", + "id": "ernie-x1-turbo-32k", + "name": "Ernie X1 Turbo 32k", + "display_name": "Ernie X1 Turbo 32k", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 32000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-27", - "last_updated": "2026-03-30", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.165, + "output": 0.66 }, "type": "chat" }, { 
- "id": "kwaipilot/kat-coder-pro-v1", - "name": "KAT-Coder-Pro V1", - "display_name": "KAT-Coder-Pro V1", + "id": "claw-low", + "name": "Claw Low", + "display_name": "Claw Low", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 1048576, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10-24", - "last_updated": "2025-10-24", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.03, - "output": 1.2, - "cache_read": 0.06 + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "bfl/flux-2-klein-9b", - "name": "FLUX.2 [klein] 9B", - "display_name": "FLUX.2 [klein] 9B", + "id": "gemini-3-pro-image-preview", + "name": "Gemini 3 Pro Image", + "display_name": "Gemini 3 Pro Image", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", - "type": "chat" + "release_date": "2025-11-18", + "last_updated": "2025-11-18", + "cost": { + "input": 2, + "output": 12 + }, + "type": "imageGeneration" }, { - "id": "bfl/flux-2-flex", - "name": "FLUX.2 [flex]", - 
"display_name": "FLUX.2 [flex]", + "id": "gemma-4-31B-Garnet", + "name": "Gemma 4 31B Garnet", + "display_name": "Gemma 4 31B Garnet", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", - "type": "imageGeneration" + "release_date": "2026-05-02", + "last_updated": "2026-05-02", + "cost": { + "input": 0.306, + "output": 0.306 + }, + "type": "chat" }, { - "id": "bfl/flux-2-klein-4b", - "name": "FLUX.2 [klein] 4B", - "display_name": "FLUX.2 [klein] 4B", + "id": "doubao-1.5-vision-pro-32k", + "name": "Doubao 1.5 Vision Pro 32k", + "display_name": "Doubao 1.5 Vision Pro 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 32000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2025-01-22", + "last_updated": "2025-01-22", + "cost": { + "input": 0.459, + "output": 1.377 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-max", - "name": "FLUX.1 Kontext Max", - "display_name": "FLUX.1 Kontext Max", + "id": "auto-model-standard", + "name": "Auto model (Standard)", + "display_name": "Auto model (Standard)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - 
"release_date": "2025-06-01", - "last_updated": "2025-06", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 9.996, + "output": 19.992 + }, "type": "chat" }, { - "id": "bfl/flux-2-pro", - "name": "FLUX.2 [pro]", - "display_name": "FLUX.2 [pro]", + "id": "Qwen3.5-27B-Marvin-DPO-V2-Derestricted-Lite", + "name": "Qwen3.5 27B Marvin DPO V2 Derestricted Lite", + "display_name": "Qwen3.5 27B Marvin DPO V2 Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 67300, - "output": 67300 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", - "type": "imageGeneration" + "release_date": "2026-04-30", + "last_updated": "2026-04-30", + "cost": { + "input": 0.306, + "output": 0.306 + }, + "type": "chat" }, { - "id": "bfl/flux-pro-1.1-ultra", - "name": "FLUX1.1 [pro] Ultra", - "display_name": "FLUX1.1 [pro] Ultra", + "id": "glm-4", + "name": "GLM-4", + "display_name": "GLM-4", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-11-01", - "last_updated": "2024-11", + "release_date": "2024-01-16", + "last_updated": "2024-01-16", + "cost": { + "input": 14.994, + "output": 14.994 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.0-fill", - "name": "FLUX.1 Fill [pro]", - 
"display_name": "FLUX.1 Fill [pro]", + "id": "Qwen3.5-27B-Writer-Derestricted-Lite", + "name": "Qwen3.5 27B Writer Derestricted Lite", + "display_name": "Qwen3.5 27B Writer Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "bfl/flux-pro-1.1", - "name": "FLUX1.1 [pro]", - "display_name": "FLUX1.1 [pro]", + "id": "qwen-3.6-plus", + "name": "Qwen 3.6 Plus", + "display_name": "Qwen 3.6 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 991800, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.45, + "output": 2.7 + }, "type": "chat" }, { - "id": "bfl/flux-kontext-pro", - "name": "FLUX.1 Kontext Pro", - "display_name": "FLUX.1 Kontext Pro", + "id": "brave-pro", + "name": "Brave (Pro)", + "display_name": "Brave (Pro)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, + "context": 8192, "output": 8192 }, - "temperature": true, 
"tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", + "cost": { + "input": 5, + "output": 5 + }, "type": "chat" }, { - "id": "bfl/flux-2-max", - "name": "FLUX.2 [max]", - "display_name": "FLUX.2 [max]", + "id": "deepseek-chat-cheaper", + "name": "DeepSeek V3/Chat Cheaper", + "display_name": "DeepSeek V3/Chat Cheaper", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 67300, - "output": 67300 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.25, + "output": 0.7 + }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "Gemma-4-31B-Queen", + "name": "Gemma 4 31B Queen", + "display_name": "Gemma 4 31B Queen", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.28, - "output": 0.42, - "cache_read": 0.028 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": 
"deepseek/deepseek-v3.2-thinking", - "name": "DeepSeek V3.2 Thinking", - "display_name": "DeepSeek V3.2 Thinking", + "id": "Gemma-4-31B-Gemopus", + "name": "Gemma 4 31B Gemopus", + "display_name": "Gemma 4 31B Gemopus", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.62, - "output": 1.85 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1-terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "mistral-code-latest", + "name": "Mistral Code Latest", + "display_name": "Mistral Code Latest", "modalities": { "input": [ "text" @@ -156686,78 +161447,78 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 256000, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-09-22", - "last_updated": "2025-09-22", + "open_weights": false, + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.27, - "output": 1, - "cache_read": 0.135 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "gemini-2.5-flash-lite", + "name": "Gemini 2.5 Flash Lite", + "display_name": "Gemini 2.5 
Flash Lite", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "jamba-mini-1.7", + "name": "Jamba Mini 1.7", + "display_name": "Jamba Mini 1.7", "modalities": { "input": [ "text" @@ -156767,154 +161528,155 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 256000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.27, - "output": 1.12, - "cache_read": 0.135 + "input": 0.1989, + "output": 0.408 }, "type": "chat" }, { - "id": "deepseek/deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "universal-summarizer", + "name": "Universal Summarizer", + 
"display_name": "Universal Summarizer", "modalities": { "input": [ - "text", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-23", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2023-05-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.0036 + "input": 30, + "output": 30 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek-V3.1", - "display_name": "DeepSeek-V3.1", + "id": "Qwen3.5-27B-Anko", + "name": "Qwen3.5 27B Anko", + "display_name": "Qwen3.5 27B Anko", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 163840, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-08-21", - "last_updated": "2025-08-21", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.56, - "output": 1.68, - "cache_read": 0.28 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "deepseek/deepseek-r1", - "name": "DeepSeek-R1", - "display_name": 
"DeepSeek-R1", + "id": "claude-sonnet-4-20250514", + "name": "Claude 4 Sonnet", + "display_name": "Claude 4 Sonnet", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-07", - "release_date": "2025-01-20", - "last_updated": "2025-05-29", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.35, - "output": 5.4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "inception/mercury-coder-small", - "name": "Mercury Coder Small Beta", - "display_name": "Mercury Coder Small Beta", + "id": "ernie-x1-32k-preview", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ "text" @@ -156927,25 +161689,24 @@ "context": 32000, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-02-26", - "last_updated": "2025-02-26", + "release_date": "2025-04-03", + "last_updated": "2025-04-03", "cost": { - "input": 0.25, - "output": 1 + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "inception/mercury-2", - "name": "Mercury 2", - "display_name": "Mercury 2", + "id": 
"azure-gpt-4-turbo", + "name": "Azure gpt-4-turbo", + "display_name": "Azure gpt-4-turbo", "modalities": { "input": [ "text" @@ -156956,245 +161717,345 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-03-06", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.024999999999999998 + "input": 9.996, + "output": 30.005 }, "type": "chat" }, { - "id": "klingai/kling-v2.6-i2v", - "name": "Kling v2.6 Image-to-Video", - "display_name": "Kling v2.6 Image-to-Video", + "id": "Meta-Llama-3-1-8B-Instruct-FP8", + "name": "Llama 3.1 8B (decentralized)", + "display_name": "Llama 3.1 8B (decentralized)", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-21", - "last_updated": "2025-12-21", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.02, + "output": 0.03 + }, "type": "chat" }, { - "id": "klingai/kling-v3.0-t2v", - "name": "Kling v3.0 Text-to-Video", - "display_name": "Kling v3.0 Text-to-Video", + "id": "claude-sonnet-4-5-20250929-thinking", + "name": "Claude Sonnet 4.5 Thinking", + "display_name": "Claude Sonnet 4.5 Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 64000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + 
"default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 2.992, + "output": 14.994 + }, "type": "chat" }, { - "id": "klingai/kling-v3.0-motion-control", - "name": "Kling v3.0 Motion Control", - "display_name": "Kling v3.0 Motion Control", + "id": "asi1-mini", + "name": "ASI1 Mini", + "display_name": "ASI1 Mini", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-04", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", + "cost": { + "input": 1, + "output": 1 + }, "type": "chat" }, { - "id": "klingai/kling-v2.6-motion-control", - "name": "Kling v2.6 Motion Control", - "display_name": "Kling v2.6 Motion Control", + "id": "qwen3.5-27b", + "name": "Qwen3.5 27B", + "display_name": "Qwen3.5 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 260096, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + 
"supported": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-21", - "last_updated": "2025-12-21", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", + "cost": { + "input": 0.27, + "output": 2.16 + }, "type": "chat" }, { - "id": "klingai/kling-v2.6-t2v", - "name": "Kling v2.6 Text-to-Video", - "display_name": "Kling v2.6 Text-to-Video", + "id": "Qwen3.5-27B-Omega-Evolution-v2.2-Derestricted-Lite", + "name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted Lite", + "display_name": "Qwen3.5 27B Omega Evolution v2.2 Derestricted Lite", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-12-21", - "last_updated": "2025-12-21", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "klingai/kling-v2.5-turbo-i2v", - "name": "Kling v2.5 Turbo Image-to-Video", - "display_name": "Kling v2.5 Turbo Image-to-Video", + "id": "claude-opus-4-1-thinking:32768", + "name": "Claude 4.1 Opus Thinking (32K)", + "display_name": "Claude 4.1 Opus Thinking (32K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + 
"context": 200000, + "output": 32000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, "type": "chat" }, { - "id": "klingai/kling-v2.5-turbo-t2v", - "name": "Kling v2.5 Turbo Text-to-Video", - "display_name": "Kling v2.5 Turbo Text-to-Video", + "id": "gemma-4-31B-K1-v5", + "name": "Gemma 4 31B K1 v5", + "display_name": "Gemma 4 31B K1 v5", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "klingai/kling-v3.0-i2v", - "name": "Kling v3.0 Image-to-Video", - "display_name": "Kling v3.0 Image-to-Video", + "id": "sonar", + "name": "Perplexity Simple", + "display_name": "Perplexity Simple", "modalities": { 
"input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 127000, + "output": 128000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", + "cost": { + "input": 1.003, + "output": 1.003 + }, "type": "chat" }, { - "id": "interfaze/interfaze-beta", - "name": "Interfaze Beta", - "display_name": "Interfaze Beta", + "id": "MiniMax-M2", + "name": "MiniMax M2", + "display_name": "MiniMax M2", "modalities": { "input": [ "text" @@ -157204,239 +162065,153 @@ ] }, "limit": { - "context": 1000000, - "output": 32000 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-10-07", - "last_updated": "2026-04-29", + "release_date": "2025-10-25", + "last_updated": "2025-10-25", "cost": { - "input": 1.5, - "output": 3.5 + "input": 0.17, + "output": 1.53 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "sarvam-105b", + "name": "Sarvam 105B", + "display_name": "Sarvam 105B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": false + "context": 131072, + "output": 4096 }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": 
true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "tool_call": true, + "reasoning": { + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-03-13", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.045, + "output": 0.177, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "Qwen3.5-27B-Writer-V2-Derestricted-Lite", + "name": "Qwen3.5 27B Writer V2 Derestricted Lite", + "display_name": "Qwen3.5 27B Writer V2 Derestricted Lite", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], 
- "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2024-11-24", - "last_updated": "2025-11-24", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "Qwen3.5-27B-Marvin-V2-Derestricted", + "name": "Qwen3.5 27B Marvin V2 Derestricted", + "display_name": "Qwen3.5 27B Marvin V2 Derestricted", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "anthropic/claude-fable-5", - "name": "Claude Fable 5", - "display_name": "Claude Fable 5", + "id": "claw-high", + "name": "Claw High", + "display_name": "Claw High", "modalities": { "input": [ "text", @@ -157451,240 +162226,118 @@ "context": 1000000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
- ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "qwen-max", + "name": "Qwen 2.5 Max", + "display_name": "Qwen 2.5 Max", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "release_date": "2024-04-03", + "last_updated": "2024-04-03", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 1.5997, + "output": 6.392 }, "type": "chat" }, { - "id": "anthropic/claude-haiku-4.5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "gemma-4-31B-Fabled", + "name": "Gemma 4 31B Fabled", + "display_name": "Gemma 4 31B Fabled", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "v0-1.5-md", + "name": "v0 1.5 MD", + "display_name": "v0 1.5 MD", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 200000, + "output": 64000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2025-07-04", + "last_updated": "2025-07-04", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 3, + "output": 15 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "claude-opus-4-thinking:1024", + "name": "Claude 4 Opus Thinking (1K)", + "display_name": "Claude 4 Opus Thinking (1K)", "modalities": { "input": [ "text", @@ -157699,16 +162352,15 @@ "context": 200000, "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { "min": 1024, @@ -157728,178 +162380,155 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", "release_date": "2025-05-22", "last_updated": "2025-05-22", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "anthropic/claude-opus-4.1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "gemini-2.5-flash-preview-04-17", + "name": "Gemini 2.5 Flash Preview", + "display_name": "Gemini 2.5 Flash Preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": 
-1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4.5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "gemini-2.5-pro-exp-03-25", + "name": "Gemini 2.5 Pro Experimental 0325", + "display_name": "Gemini 2.5 Pro Experimental 0325", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "budget", "budget": { - "min": 1024, + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, "unit": "tokens" }, - "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2025-03-25", + "last_updated": "2025-03-25", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "anthropic/claude-3-haiku", - "name": "Claude Haiku 3", - "display_name": "Claude Haiku 3", + "id": "hermes-medium", + "name": "Hermes Medium", + "display_name": "Hermes Medium", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 4096 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-08-31", - "release_date": "2024-03-13", - "last_updated": "2024-03-13", + "release_date": "2026-05-11", + "last_updated": "2026-05-11", "cost": { - "input": 0.25, - "output": 1.25, - "cache_read": 0.03, - "cache_write": 0.3 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "anthropic/claude-3.5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "sonar-pro", + "name": "Perplexity Pro", + "display_name": "Perplexity Pro", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -157907,34 +162536,29 @@ }, "limit": { "context": 200000, - "output": 8192 + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - 
"cache_write": 1 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "anthropic/claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "doubao-1-5-thinking-pro-250415", + "name": "Doubao 1.5 Thinking Pro", + "display_name": "Doubao 1.5 Thinking Pro", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -157942,53 +162566,27 @@ ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "alibaba/qwen-3-14b", - "name": "Qwen3-14B", - "display_name": "Qwen3-14B", + "id": "qwen3.7-max:thinking", + "name": "Qwen3.7 Max Thinking", + "display_name": "Qwen3.7 Max Thinking", "modalities": { "input": [ "text" @@ -157998,133 +162596,141 @@ ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 1000000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2026-05-21", + "last_updated": "2026-05-21", "cost": { - "input": 0.12, - "output": 0.24 + "input": 2.5, + "output": 7.5, + "cache_read": 0.25 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-instruct", - "name": "Qwen3 Next 80B A3B Instruct", - "display_name": "Qwen3 Next 80B A3B Instruct", + "id": "ernie-4.5-turbo-vl-32k", + "name": "Ernie 4.5 Turbo VL 32k", + "display_name": "Ernie 4.5 Turbo VL 32k", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 32000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-12", - "last_updated": "2025-09", + "attachment": true, + "open_weights": false, + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.15, - "output": 1.2 + "input": 0.495, + 
"output": 1.43 }, "type": "chat" }, { - "id": "alibaba/qwen3-max-preview", - "name": "Qwen3 Max Preview", - "display_name": "Qwen3 Max Preview", + "id": "gemini-2.5-pro-preview-05-06", + "name": "Gemini 2.5 Pro Preview 0506", + "display_name": "Gemini 2.5 Pro Preview 0506", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-05-06", + "last_updated": "2025-05-06", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "alibaba/wan-v2.6-r2v-flash", - "name": "Wan v2.6 Reference-to-Video Flash", - "display_name": "Wan v2.6 Reference-to-Video Flash", + "id": "hunyuan-turbos-20250226", + "name": "Hunyuan Turbo S", + "display_name": "Hunyuan Turbo S", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 24000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "cost": { + "input": 0.187, + "output": 0.374 + }, "type": "chat" }, { - "id": 
"alibaba/qwen3-vl-thinking", - "name": "Qwen3 VL Thinking", - "display_name": "Qwen3 VL Thinking", + "id": "claude-sonnet-4-thinking:64000", + "name": "Claude 4 Sonnet Thinking (64K)", + "display_name": "Claude 4 Sonnet Thinking (64K)", "modalities": { "input": [ "text", @@ -158136,10 +162742,9 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -158148,81 +162753,176 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.4, - "output": 4 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-235b-a22b-instruct", - "name": "Qwen3 VL 235B A22B Instruct", - "display_name": "Qwen3 VL 235B A22B Instruct", + "id": "ernie-x1-32k", + "name": "Ernie X1 32k", + "display_name": "Ernie X1 32k", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2026-05-01", + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.4, - "output": 1.6 + 
"input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "alibaba/qwen3.6-27b", - "name": "Qwen 3.6 27B", - "display_name": "Qwen 3.6 27B", + "id": "command-a-reasoning-08-2025", + "name": "Cohere Command A (08/2025)", + "display_name": "Cohere Command A (08/2025)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-22", + "last_updated": "2025-08-22", + "cost": { + "input": 2.5, + "output": 10 + }, + "type": "chat" + }, + { + "id": "doubao-seed-2-0-code-preview-260215", + "name": "Doubao Seed 2.0 Code Preview", + "display_name": "Doubao Seed 2.0 Code Preview", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-02-14", + "last_updated": "2026-02-14", + "cost": { + "input": 0.782, + "output": 3.893 + }, + "type": "chat" + }, + { + "id": "doubao-1.5-pro-256k", + "name": "Doubao 1.5 Pro 256k", + "display_name": "Doubao 1.5 Pro 256k", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-03-12", + "last_updated": "2025-03-12", + "cost": { + "input": 0.799, + "output": 1.445 + }, + "type": "chat" + }, + { + "id": "qwen3.5-35b-a3b", + "name": "Qwen3.5 35B A3B", + "display_name": "Qwen3.5 35B A3B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 260096, + "output": 65536 }, - "temperature": true, - "tool_call": 
true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -158237,34 +162937,33 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.225, + "output": 1.8 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-plus", - "name": "Qwen 3.5 Plus", - "display_name": "Qwen 3.5 Plus", + "id": "qwen3.5-122b-a10b:thinking", + "name": "Qwen3.5 122B A10B Thinking", + "display_name": "Qwen3.5 122B A10B Thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 260096, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -158282,21 +162981,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04, - "cache_write": 0.5 + "input": 0.36, + "output": 2.88 }, "type": "chat" }, { - "id": "alibaba/qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "yi-lightning", + "name": "Yi Lightning", + "display_name": "Yi Lightning", "modalities": { "input": [ "text" @@ -158306,41 +163002,81 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 12000, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-10-16", + "last_updated": "2024-10-16", + "cost": { + "input": 0.2006, + "output": 0.2006 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4-5-20250929", + "name": "Claude Sonnet 4.5", + 
"display_name": "Claude Sonnet 4.5", + "modalities": { + "input": [ + "text", + "image", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-23", - "last_updated": "2025-09-23", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 2.992, + "output": 14.994 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "deepseek-math-v2", + "name": "DeepSeek Math V2", + "display_name": "DeepSeek Math V2", "modalities": { "input": [ "text" @@ -158350,62 +163086,122 @@ ] }, "limit": { - "context": 1000000, + "context": 128000, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2025-12-03", + "last_updated": "2025-12-03", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.2 + "input": 0.6, + "output": 2.2 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 
Coder Next", + "id": "claude-opus-4-1-thinking:8192", + "name": "Claude 4.1 Opus Thinking (8K)", + "display_name": "Claude 4.1 Opus Thinking (8K)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-05-22", + "last_updated": "2025-05-22", + "cost": { + "input": 14.994, + "output": 75.004 + }, + "type": "chat" + }, + { + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 64000, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": false, - "release_date": "2025-07-22", - "last_updated": "2026-02-19", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.5, - "output": 1.2 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "alibaba/qwen3.5-flash", - "name": "Qwen 3.5 Flash", - "display_name": "Qwen 3.5 Flash", + "id": 
"gemini-2.5-flash-nothinking", + "name": "Gemini 2.5 Flash (No Thinking)", + "display_name": "Gemini 2.5 Flash (No Thinking)", "modalities": { "input": [ "text", @@ -158417,11 +163213,10 @@ ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -158429,113 +163224,126 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2025-06-05", + "last_updated": "2025-06-05", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.001, - "cache_write": 0.125 + "input": 0.3, + "output": 2.5 }, "type": "chat" }, { - "id": "alibaba/qwen3.7-max", - "name": "Qwen 3.7 Max", - "display_name": "Qwen 3.7 Max", + "id": "Qwen3.5-27B-Omega-Evolution-v2.0-Derestricted-Lite", + "name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted Lite", + "display_name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted Lite", "modalities": { "input": [ "text", - "pdf" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 991000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + 
"release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 1.25, - "output": 3.75, - "cache_read": 0.25, - "cache_write": 1.5625 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "alibaba/wan-v2.5-t2v-preview", - "name": "Wan v2.5 Text-to-Video Preview", - "display_name": "Wan v2.5 Text-to-Video Preview", + "id": "fastgpt", + "name": "Web Answer", + "display_name": "Web Answer", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "release_date": "2023-08-01", + "last_updated": "2024-01-01", + "cost": { + "input": 7.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "alibaba/qwen3.6-plus", - "name": "Qwen 3.6 Plus", - "display_name": "Qwen 3.6 Plus", + "id": "Qwen3.5-27B-Infracelestial", + "name": "Qwen3.5 27B Infracelestial", + "display_name": "Qwen3.5 27B Infracelestial", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -158553,21 +163361,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.1, - "cache_write": 0.625 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "alibaba/qwen3-next-80b-a3b-thinking", - "name": "Qwen3 Next 80B A3B Thinking", - "display_name": "Qwen3 Next 80B A3B Thinking", + "id": "glm-4-flash", + "name": "GLM-4 Flash", + "display_name": 
"GLM-4 Flash", "modalities": { "input": [ "text" @@ -158577,68 +163382,58 @@ ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-09", - "release_date": "2025-09-12", - "last_updated": "2025-09", + "open_weights": false, + "release_date": "2024-08-01", + "last_updated": "2024-08-01", "cost": { - "input": 0.15, - "output": 1.2 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "alibaba/qwen3-embedding-8b", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "azure-gpt-4o-mini", + "name": "Azure gpt-4o-mini", + "display_name": "Azure gpt-4o-mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "type": "embedding" + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.1496, + "output": 0.595 + }, + "type": "chat" }, { - "id": "alibaba/qwen3-embedding-4b", - "name": "Qwen3 Embedding 4B", - "display_name": "Qwen3 Embedding 4B", + "id": "sonar-deep-research", + "name": "Perplexity Deep Research", + "display_name": "Perplexity Deep Research", "modalities": { "input": [ "text" @@ -158648,24 +163443,27 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 60000, + "output": 128000 }, - 
"temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-05", - "last_updated": "2025-06-05", - "type": "embedding" + "release_date": "2025-02-25", + "last_updated": "2025-02-25", + "cost": { + "input": 3.4, + "output": 13.6 + }, + "type": "chat" }, { - "id": "alibaba/qwen3-embedding-0.6b", - "name": "Qwen3 Embedding 0.6B", - "display_name": "Qwen3 Embedding 0.6B", + "id": "qwq-32b", + "name": "Qwen: QwQ 32B", + "display_name": "Qwen: QwQ 32B", "modalities": { "input": [ "text" @@ -158675,24 +163473,38 @@ ] }, "limit": { - "context": 32768, + "context": 128000, "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "release_date": "2025-11-14", - "last_updated": "2025-11-14", - "type": "embedding" + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.25599999, + "output": 0.30499999 + }, + "type": "chat" }, { - "id": "alibaba/qwen-3-235b", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "mistral-code-agent-latest", + "name": "Mistral Code Agent Latest", + "display_name": "Mistral Code Agent Latest", "modalities": { "input": [ "text" @@ -158703,190 +163515,205 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2026-06-02", + "last_updated": "2026-06-02", "cost": { - "input": 0.22, - "output": 0.88 + "input": 0.4, + "output": 2 }, "type": "chat" 
}, { - "id": "alibaba/qwen3-coder-30b-a3b", - "name": "Qwen 3 Coder 30B A3B Instruct", - "display_name": "Qwen 3 Coder 30B A3B Instruct", + "id": "glm-4.1v-thinking-flash", + "name": "GLM 4.1V Thinking Flash", + "display_name": "GLM 4.1V Thinking Flash", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 64000, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2025-07-09", + "last_updated": "2025-07-09", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "alibaba/qwen3-coder", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "qwen3.5-omni-flash", + "name": "Qwen3.5 Omni Flash", + "display_name": "Qwen3.5 Omni Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 49152, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 1.5, - "output": 7.5, - "cache_read": 0.3 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "alibaba/wan-v2.6-i2v-flash", - "name": "Wan v2.6 Image-to-Video Flash", - "display_name": "Wan v2.6 Image-to-Video Flash", + "id": "gemma-4-31B-MeroMero", + "name": "Gemma 4 31B MeroMero", + "display_name": "Gemma 4 31B MeroMero", "modalities": { "input": [ - 
"text" + "text", + "image", + "video" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", + "cost": { + "input": 0.306, + "output": 0.306 + }, "type": "chat" }, { - "id": "alibaba/qwen3.7-plus", - "name": "Qwen 3.7 Plus", - "display_name": "Qwen 3.7 Plus", + "id": "gemini-2.5-flash-preview-04-17:thinking", + "name": "Gemini 2.5 Flash Preview Thinking", + "display_name": "Gemini 2.5 Flash Preview Thinking", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-06-01", - "last_updated": "2026-06-02", + "release_date": "2025-04-17", + "last_updated": "2025-04-17", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.08, - "cache_write": 0.5 + "input": 0.15, + "output": 3.5 }, "type": "chat" }, { - "id": "alibaba/wan-v2.6-r2v", - "name": "Wan v2.6 Reference-to-Video", - "display_name": "Wan v2.6 Reference-to-Video", + "id": "glm-4-air", + "name": "GLM-4 Air", + "display_name": "GLM-4 Air", "modalities": { 
"input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2024-06-05", + "last_updated": "2024-06-05", + "cost": { + "input": 0.2006, + "output": 0.2006 + }, "type": "chat" }, { - "id": "alibaba/qwen-3-32b", - "name": "Qwen 3.32B", - "display_name": "Qwen 3.32B", + "id": "doubao-seed-1-6-thinking-250615", + "name": "Doubao Seed 1.6 Thinking", + "display_name": "Doubao Seed 1.6 Thinking", "modalities": { "input": [ "text" @@ -158896,46 +163723,72 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2025-06-15", + "last_updated": "2025-06-15", "cost": { - "input": 0.16, - "output": 0.64 + "input": 0.204, + "output": 2.04 }, "type": "chat" }, { - "id": "alibaba/qwen3-235b-a22b-thinking", - "name": "Qwen3 235B A22B Thinking 2507", - "display_name": "Qwen3 235B A22B Thinking 2507", + "id": "auto-model-basic", + "name": "Auto model (Basic)", + "display_name": "Auto model (Basic)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 1000000, + "output": 1000000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 9.996, + "output": 19.992 + }, + "type": "chat" + }, + { + "id": "Qwen3.5-27B-RpRMax-v1", + "name": "Qwen3.5 27B RpRMax v1", + 
"display_name": "Qwen3.5 27B RpRMax v1", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -158953,33 +163806,71 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-04", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.4, - "output": 4 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "alibaba/qwen3-max-thinking", - "name": "Qwen 3 Max Thinking", - "display_name": "Qwen 3 Max Thinking", + "id": "ernie-5.1", + "name": "ERNIE 5.1", + "display_name": "ERNIE 5.1", "modalities": { "input": [ + "text", + "image", + "video" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 119000, + "output": 64000 + }, + "tool_call": false, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-05-10", + "last_updated": "2026-05-10", + "cost": { + "input": 0.75, + "output": 3, + "cache_read": 0.75 + }, + "type": "chat" + }, + { + "id": "Qwen3.5-27B-Marvin-DPO-V2-Derestricted", + "name": "Qwen3.5 27B Marvin DPO V2 Derestricted", + "display_name": "Qwen3.5 27B Marvin DPO V2 Derestricted", + "modalities": { + "input": [ + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 65536 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -158995,178 +163886,200 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01", - "last_updated": "2025-01", + "attachment": true, + 
"open_weights": false, + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 1.2, - "output": 6, - "cache_read": 0.24 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "alibaba/qwen-3.6-max-preview", - "name": "Qwen 3.6 Max Preview", - "display_name": "Qwen 3.6 Max Preview", + "id": "azure-gpt-4o", + "name": "Azure gpt-4o", + "display_name": "Azure gpt-4o", "modalities": { "input": [ "text", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 240000, - "output": 64000 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 1.3, - "output": 7.8, - "cache_read": 0.26, - "cache_write": 1.625 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "alibaba/wan-v2.6-i2v", - "name": "Wan v2.6 Image-to-Video", - "display_name": "Wan v2.6 Image-to-Video", + "id": "deepseek-chat", + "name": "DeepSeek V3/Deepseek Chat", + "display_name": "DeepSeek V3/Deepseek Chat", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "cost": { + "input": 0.25, + "output": 0.7 + }, "type": "chat" }, { - "id": "alibaba/qwen-3-30b", - "name": "Qwen3-30B-A3B", - "display_name": "Qwen3-30B-A3B", + "id": "gemini-2.5-flash-preview-05-20", + "name": "Gemini 2.5 Flash 0520", + "display_name": "Gemini 2.5 
Flash 0520", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 40960, - "output": 16384 + "context": 1048000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 0, + "max": 24576, + "auto": -1, + "off": 0, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2025-04-01", - "last_updated": "2025-04", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0.12, - "output": 0.5 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": "alibaba/wan-v2.6-t2v", - "name": "Wan v2.6 Text-to-Video", - "display_name": "Wan v2.6 Text-to-Video", + "id": "mercury-2", + "name": "Mercury 2", + "display_name": "Mercury 2", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 50000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", + "cost": { + "input": 0.25, + "output": 0.75, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "alibaba/qwen3-vl-instruct", - "name": "Qwen3 VL Instruct", - "display_name": "Qwen3 VL Instruct", + "id": "qwen3.7-plus:thinking", + "name": "Qwen3.7 Plus Thinking", + "display_name": "Qwen3.7 Plus Thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], 
"output": [ "text" ] }, "limit": { - "context": 131072, - "output": 129024 + "context": 983616, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-24", - "last_updated": "2025-09-24", + "open_weights": false, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { "input": 0.4, - "output": 1.6 + "output": 1.6, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-pro", - "name": "MiMo V2 Pro", - "display_name": "MiMo V2 Pro", + "id": "gemini-2.0-flash-thinking-exp-1219", + "name": "Gemini 2.0 Flash Thinking 1219", + "display_name": "Gemini 2.0 Flash Thinking 1219", "modalities": { "input": [ "text" @@ -159176,67 +164089,57 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 32767, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "release_date": "2024-12-19", + "last_updated": "2024-12-19", "cost": { - "input": 1, - "output": 3, - "cache_read": 0.2 + "input": 0.1003, + "output": 0.408 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5", - "name": "MiMo M2.5", - "display_name": "MiMo M2.5", + "id": "glm-4-plus-0111", + "name": "GLM 4 Plus 0111", + "display_name": "GLM 4 Plus 0111", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 131100 + "context": 128000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": 
false, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2025-02-19", + "last_updated": "2025-02-19", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.0028 + "input": 9.996, + "output": 9.996 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2-flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", + "id": "brave", + "name": "Brave (Answers)", + "display_name": "Brave (Answers)", "modalities": { "input": [ "text" @@ -159246,127 +164149,152 @@ ] }, "limit": { - "context": 262144, - "output": 32000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-17", - "last_updated": "2026-02-04", + "release_date": "2023-03-02", + "last_updated": "2024-01-01", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01 + "input": 5, + "output": 5 }, "type": "chat" }, { - "id": "xiaomi/mimo-v2.5-pro", - "name": "MiMo V2.5 Pro", - "display_name": "MiMo V2.5 Pro", + "id": "glm-zero-preview", + "name": "GLM Zero Preview", + "display_name": "GLM Zero Preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 131000 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2026-04-22", - "last_updated": "2026-04-22", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.435, - "output": 0.87, - "cache_read": 0.0036 + "input": 1.802, + "output": 1.802 }, "type": "chat" }, { - "id": "mistral/codestral-embed", - "name": 
"Codestral Embed", - "display_name": "Codestral Embed", + "id": "gemini-2.5-flash-lite-preview-06-17", + "name": "Gemini 2.5 Flash Lite Preview", + "display_name": "Gemini 2.5 Flash Lite Preview", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", + "cost": { + "input": 0.15, + "output": 0.6 + }, "type": "chat" }, { - "id": "mistral/mistral-large-3", - "name": "Mistral Large 3", - "display_name": "Mistral Large 3", + "id": "Qwen3.5-27B-Writer-Derestricted", + "name": "Qwen3.5 27B Writer Derestricted", + "display_name": "Qwen3.5 27B Writer Derestricted", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-02", - "last_updated": "2025-12-02", + "release_date": "2026-04-06", + "last_updated": 
"2026-04-06", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral/devstral-small-2", - "name": "Devstral Small 2", - "display_name": "Devstral Small 2", + "id": "KAT-Coder-Exp-72B-1010", + "name": "KAT Coder Exp 72B 1010", + "display_name": "KAT Coder Exp 72B 1010", "modalities": { "input": [ "text" @@ -159376,56 +164304,122 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "cost": { "input": 0.1, - "output": 0.3 + "output": 0.2 }, "type": "chat" }, { - "id": "mistral/mistral-embed", - "name": "Mistral Embed", - "display_name": "Mistral Embed", + "id": "gemini-2.5-pro-preview-06-05", + "name": "Gemini 2.5 Pro Preview 0605", + "display_name": "Gemini 2.5 Pro Preview 0605", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 1048756, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-06-05", + "last_updated": "2025-06-05", + "cost": { + "input": 2.5, + "output": 10 + }, + "type": "chat" + }, + { + "id": "Qwen3.5-27B-Musica-v1", + "name": "Qwen3.5 27B Musica v1", + "display_name": "Qwen3.5 27B Musica v1", + "modalities": { + "input": [ + "text", + "image", + "video" ], 
"output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", + "cost": { + "input": 0.306, + "output": 0.306 }, - "attachment": false, - "open_weights": false, - "release_date": "2023-12-11", - "last_updated": "2023-12-11", "type": "chat" }, { - "id": "mistral/mistral-nemo", - "name": "Mistral Nemo", - "display_name": "Mistral Nemo", + "id": "MiniMax-M1", + "name": "MiniMax M1", + "display_name": "MiniMax M1", "modalities": { "input": [ "text" @@ -159435,160 +164429,168 @@ ] }, "limit": { - "context": 131072, + "context": 1000000, "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-01", - "last_updated": "2024-07-01", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0.1394, + "output": 1.3328 }, "type": "chat" }, { - "id": "mistral/mistral-medium-3.5", - "name": "Mistral Medium Latest", - "display_name": "Mistral Medium Latest", + "id": "doubao-1-5-thinking-pro-vision-250415", + "name": "Doubao 1.5 Thinking Pro Vision", + "display_name": "Doubao 1.5 Thinking Pro Vision", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + 
"supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "mistral/ministral-14b", - "name": "Ministral 14B", - "display_name": "Ministral 14B", + "id": "qwen3.5-27b:thinking", + "name": "Qwen3.5 27B Thinking", + "display_name": "Qwen3.5 27B Thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 260096, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2025-12-01", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.27, + "output": 2.16 }, "type": "chat" }, { - "id": "mistral/mistral-medium", - "name": "Mistral Medium 3.1", - "display_name": "Mistral Medium 3.1", + "id": "Qwen3.5-27B-Omega-Evolution-v2.0-Derestricted", + "name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted", + "display_name": "Qwen3.5 27B Omega Evolution v2.0 Derestricted", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - 
"release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 0.4, - "output": 2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral/devstral-small", - "name": "Devstral Small 1.1", - "display_name": "Devstral Small 1.1", + "id": "Gemma-4-31B-GarnetV2", + "name": "Gemma 4 31B Garnet V2", + "display_name": "Gemma 4 31B Garnet V2", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-05-07", - "last_updated": "2025-05-07", + "release_date": "2026-05-01", + "last_updated": "2026-05-01", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral/devstral-2", - "name": "Devstral 2", - "display_name": "Devstral 2", + "id": "qwen-turbo", + "name": "Qwen Turbo", + "display_name": "Qwen Turbo", "modalities": { "input": [ "text" @@ -159598,29 +164600,38 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-09", - "last_updated": "2025-12-09", + "release_date": "2024-11-01", + "last_updated": "2024-11-01", "cost": { - "input": 0.4, - "output": 2 + "input": 0.04998, + 
"output": 0.2006 }, "type": "chat" }, { - "id": "mistral/ministral-8b", - "name": "Ministral 8B (latest)", - "display_name": "Ministral 8B (latest)", + "id": "phi-4-multimodal-instruct", + "name": "Phi 4 Multimodal", + "display_name": "Phi 4 Multimodal", "modalities": { "input": [ "text" @@ -159631,28 +164642,26 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "open_weights": false, + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.07, + "output": 0.11 }, "type": "chat" }, { - "id": "mistral/pixtral-large", - "name": "Pixtral Large (latest)", - "display_name": "Pixtral Large (latest)", + "id": "mistral-small-31-24b-instruct", + "name": "Mistral Small 31 24b Instruct", + "display_name": "Mistral Small 31 24b Instruct", "modalities": { "input": [ "text", @@ -159664,28 +164673,26 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-11", - "release_date": "2024-11-01", - "last_updated": "2024-11-04", + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 2, - "output": 6 + "input": 0.1, + "output": 0.3 }, "type": "chat" }, { - "id": "mistral/pixtral-12b", - "name": "Pixtral 12B", - "display_name": "Pixtral 12B", + "id": "ernie-4.5-turbo-128k", + "name": "Ernie 4.5 Turbo 128k", + "display_name": "Ernie 4.5 Turbo 128k", "modalities": { "input": [ "text", @@ -159697,127 +164704,152 @@ }, "limit": { "context": 128000, - "output": 128000 + "output": 16384 }, - "temperature": true, - "tool_call": true, 
+ "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-01", - "last_updated": "2024-09-01", + "open_weights": false, + "release_date": "2025-05-08", + "last_updated": "2025-05-08", "cost": { - "input": 0.15, - "output": 0.15 + "input": 0.132, + "output": 0.55 }, "type": "chat" }, { - "id": "mistral/magistral-small", - "name": "Magistral Small", - "display_name": "Magistral Small", + "id": "Qwen3.5-27B-BlueStar-Derestricted", + "name": "Qwen3.5 27B BlueStar Derestricted", + "display_name": "Qwen3.5 27B BlueStar Derestricted", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-04-06", + "last_updated": "2026-04-06", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "mistral/codestral", - "name": "Codestral (latest)", - "display_name": "Codestral (latest)", + "id": "gemini-2.5-flash-lite-preview-09-2025-thinking", + "name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", + "display_name": "Gemini 2.5 Flash Lite Preview (09/2025) – Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 4096 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-05-29", - "last_updated": "2025-01-04", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "default": -1, + "min": 512, + "max": 24576, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "mistral/mistral-small", - "name": "Mistral Small (latest)", - "display_name": "Mistral Small (latest)", + "id": "doubao-seed-1-8-251215", + "name": "Doubao Seed 1.8", + "display_name": "Doubao Seed 1.8", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-03-16", - "last_updated": "2026-03-16", + "attachment": false, + "open_weights": false, + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.612, + "output": 6.12 }, "type": "chat" }, { - "id": "mistral/magistral-medium", - "name": "Magistral Medium (latest)", - "display_name": "Magistral Medium (latest)", + "id": "qwen3.6-max-preview", + "name": "Qwen3.6 Max Preview", + "display_name": "Qwen3.6 Max Preview", "modalities": { "input": [ "text" @@ -159827,30 +164859,38 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 245800, + "output": 
65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-03-17", - "last_updated": "2025-03-20", + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 5 + "input": 1.3, + "output": 7.8 }, "type": "chat" }, { - "id": "mistral/ministral-3b", - "name": "Ministral 3B (latest)", - "display_name": "Ministral 3B (latest)", + "id": "exa-answer", + "name": "Exa (Answer)", + "display_name": "Exa (Answer)", "modalities": { "input": [ "text" @@ -159860,148 +164900,146 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 4096, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2024-10-01", - "last_updated": "2024-10-04", + "open_weights": false, + "release_date": "2025-06-04", + "last_updated": "2025-06-04", "cost": { - "input": 0.04, - "output": 0.04 + "input": 2.5, + "output": 2.5 }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent", - "name": "Grok 4.20 Multi-Agent", - "display_name": "Grok 4.20 Multi-Agent", + "id": "Baichuan4-Air", + "name": "Baichuan 4 Air", + "display_name": "Baichuan 4 Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, 
"open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "release_date": "2025-08-19", + "last_updated": "2025-08-19", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.157, + "output": 0.157 }, "type": "chat" }, { - "id": "xai/grok-4.20-reasoning", - "name": "Grok 4.20 Reasoning", - "display_name": "Grok 4.20 Reasoning", + "id": "qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B", + "display_name": "Qwen3.5 122B A10B", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 260096, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + "release_date": "2026-02-24", + "last_updated": "2026-02-24", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.36, + "output": 2.88 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-non-reasoning", - "name": "Grok 4.1 Fast Non-Reasoning", - "display_name": "Grok 4.1 Fast Non-Reasoning", + "id": "sarvam-30b", + "name": "Sarvam 30B", + "display_name": "Sarvam 30B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 65536, + "output": 4096 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-05-12", + "last_updated": 
"2026-05-12", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 0.028, + "output": 0.111, + "cache_read": 0.017 }, "type": "chat" }, { - "id": "xai/grok-build-0.1", - "name": "Grok Build 0.1", - "display_name": "Grok Build 0.1", + "id": "claude-opus-4-1-thinking", + "name": "Claude 4.1 Opus Thinking", + "display_name": "Claude 4.1 Opus Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -160009,24 +165047,39 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] } }, "attachment": true, "open_weights": false, - "release_date": "2026-05-20", - "last_updated": "2026-04-16", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.2 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "xai/grok-4.1-fast-reasoning", - "name": "Grok 4.1 Fast Reasoning", - "display_name": "Grok 4.1 Fast Reasoning", + "id": "claude-opus-4-thinking:32000", + "name": "Claude 4 Opus Thinking (32K)", + "display_name": "Claude 4 Opus Thinking (32K)", "modalities": { "input": [ "text", @@ -160038,210 +165091,227 @@ ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 200000, + "output": 32000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.2, - "output": 0.5, - "cache_read": 0.05 + "input": 14.994, + "output": 75.004 }, "type": "chat" }, { - "id": "xai/grok-imagine-video-1.5-preview", - "name": "Grok Imagine Video 1.5 Preview", - "display_name": "Grok Imagine Video 1.5 Preview", + "id": "auto-model", + "name": "Auto model", + "display_name": "Auto model", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 1000000, + "output": 1000000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-30", - "last_updated": "2026-05-30", + "release_date": "2024-06-01", + "last_updated": "2024-06-01", + "cost": { + "input": 0, + "output": 0 + }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning-beta", - "name": "Grok 4.20 Beta Non-Reasoning", - "display_name": "Grok 4.20 Beta Non-Reasoning", + "id": "qwen3-vl-235b-a22b-instruct-original", + "name": "Qwen3 VL 235B A22B Instruct Original", + "display_name": "Qwen3 VL 235B A22B Instruct Original", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.4 + "input": 0.5, + "output": 1.2 }, "type": "chat" }, { - "id": "xai/grok-4.3", - "name": "Grok 4.3", - "display_name": "Grok 4.3", + "id": 
"glm-z1-air", + "name": "GLM Z1 Air", + "display_name": "GLM Z1 Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 32000, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-17", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.07, + "output": 0.07 }, "type": "chat" }, { - "id": "xai/grok-4.20-reasoning-beta", - "name": "Grok 4.20 Beta Reasoning", - "display_name": "Grok 4.20 Beta Reasoning", + "id": "Qwen3.5-27B-Queen-Derestricted-Lite", + "name": "Qwen3.5 27B Queen Derestricted Lite", + "display_name": "Qwen3.5 27B Queen Derestricted Lite", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "xai/grok-imagine-image", - "name": "Grok Imagine Image", - "display_name": "Grok Imagine Image", + "id": "inclusionai/ling-2.6-1t", + "name": "Ling 2.6 1T", + 
"display_name": "Ling 2.6 1T", "modalities": { "input": [ "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-02-19", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", + "cost": { + "input": 0.3, + "output": 2.5, + "cache_read": 0.06 + }, "type": "chat" }, { - "id": "xai/grok-4.20-multi-agent-beta", - "name": "Grok 4.20 Multi Agent Beta", - "display_name": "Grok 4.20 Multi Agent Beta", + "id": "inclusionai/ring-2.6-1t", + "name": "Ring 2.6 1T", + "display_name": "Ring 2.6 1T", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262144, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -160249,80 +165319,78 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-11", - "last_updated": "2026-03-13", + "release_date": "2026-05-08", + "last_updated": "2026-05-08", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "xai/grok-4.20-non-reasoning", - "name": "Grok 4.20 Non-Reasoning", - "display_name": "Grok 4.20 Non-Reasoning", + "id": "inclusionai/ling-2.6-flash", + "name": "Ling 2.6 Flash", + "display_name": "Ling 2.6 Flash", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 2000000 + "context": 262144, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-09", - "last_updated": "2026-03-23", + 
"release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1.25, - "output": 2.5, - "cache_read": 0.2 + "input": 0.08, + "output": 0.24 }, "type": "chat" }, { - "id": "xai/grok-imagine-video", - "name": "Grok Imagine", - "display_name": "Grok Imagine", + "id": "Alibaba-NLP/Tongyi-DeepResearch-30B-A3B", + "name": "Tongyi DeepResearch 30B A3B", + "display_name": "Tongyi DeepResearch 30B A3B", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.08, + "output": 0.24000000000000002 + }, "type": "chat" }, { - "id": "cohere/rerank-v4-pro", - "name": "Cohere Rerank 4 Pro", - "display_name": "Cohere Rerank 4 Pro", + "id": "ibm-granite/granite-4.1-8b", + "name": "Granite 4.1 8B", + "display_name": "Granite 4.1 8B", "modalities": { "input": [ "text" @@ -160332,24 +165400,28 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 131072, + "output": 131072 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 0.05, + "output": 0.1, + "cache_read": 0.05 + }, "type": "chat" }, { - "id": "cohere/rerank-v4-fast", - "name": "Cohere Rerank 4 Fast", - "display_name": "Cohere Rerank 4 Fast", + "id": "Salesforce/Llama-xLAM-2-70b-fc-r", + "name": "Llama-xLAM-2 70B fc-r", + "display_name": "Llama-xLAM-2 70B fc-r", "modalities": { "input": [ "text" @@ -160359,24 +165431,27 @@ ] }, "limit": { - "context": 32000, - "output": 32000 
+ "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", + "cost": { + "input": 2.5, + "output": 2.5 + }, "type": "chat" }, { - "id": "cohere/embed-v4.0", - "name": "Embed v4.0", - "display_name": "Embed v4.0", + "id": "THUDM/GLM-Z1-32B-0414", + "name": "GLM Z1 32B 0414", + "display_name": "GLM Z1 32B 0414", "modalities": { "input": [ "text" @@ -160386,10 +165461,9 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false @@ -160398,44 +165472,16 @@ "open_weights": false, "release_date": "2025-04-15", "last_updated": "2025-04-15", - "type": "chat" - }, - { - "id": "cohere/command-a", - "name": "Command A", - "display_name": "Command A", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 256000, - "output": 8000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-03-13", - "last_updated": "2025-03-13", "cost": { - "input": 2.5, - "output": 10 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "cohere/rerank-v3.5", - "name": "Cohere Rerank 3.5", - "display_name": "Cohere Rerank 3.5", + "id": "THUDM/GLM-4-32B-0414", + "name": "GLM 4 32B 0414", + "display_name": "GLM 4 32B 0414", "modalities": { "input": [ "text" @@ -160445,64 +165491,27 @@ ] }, "limit": { - "context": 4096, - "output": 4096 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-12-02", - "last_updated": "2024-12-02", - 
"type": "chat" - }, - { - "id": "moonshotai/kimi-k2-thinking-turbo", - "name": "Kimi K2 Thinking Turbo", - "display_name": "Kimi K2 Thinking Turbo", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262114, - "output": 262114 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "THUDM/GLM-4-9B-0414", + "name": "GLM 4 9B 0414", + "display_name": "GLM 4 9B 0414", "modalities": { "input": [ "text" @@ -160512,83 +165521,57 @@ ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 32000, + "output": 8000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.6, - "output": 2.5, - "cache_read": 0.15 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "THUDM/GLM-Z1-9B-0414", + "name": "GLM Z1 9B 0414", + "display_name": "GLM Z1 9B 0414", 
"modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true + "context": 32000, + "output": 8000 }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "tool_call": false, + "reasoning": { + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-20", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2-turbo", - "name": "Kimi K2 Turbo", - "display_name": "Kimi K2 Turbo", + "id": "meta-llama/llama-3.1-8b-instruct", + "name": "Llama 3.1 8b Instruct", + "display_name": "Llama 3.1 8b Instruct", "modalities": { "input": [ "text" @@ -160598,30 +165581,27 @@ ] }, "limit": { - "context": 256000, + "context": 131072, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-08", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1.15, - "output": 8, - "cache_read": 0.15 + "input": 0.0544, + "output": 0.0544 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "meta-llama/llama-4-maverick", + "name": "Llama 4 Maverick", + "display_name": "Llama 4 Maverick", "modalities": { "input": [ "text", @@ -160632,71 +165612,57 @@ ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": 
true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-26", - "last_updated": "2026-01", + "open_weights": false, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.1 + "input": 0.18000000000000002, + "output": 0.8 }, "type": "chat" }, { - "id": "perplexity/sonar", - "name": "Sonar", - "display_name": "Sonar", + "id": "meta-llama/llama-3.3-70b-instruct", + "name": "Llama 3.3 70b Instruct", + "display_name": "Llama 3.3 70b Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 131072, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", + "cost": { + "input": 0.05, + "output": 0.23 + }, "type": "chat" }, { - "id": "perplexity/sonar-pro", - "name": "Sonar Pro", - "display_name": "Sonar Pro", + "id": "meta-llama/llama-4-scout", + "name": "Llama 4 Scout", + "display_name": "Llama 4 Scout", "modalities": { "input": [ "text", @@ -160707,81 +165673,88 @@ ] }, "limit": { - "context": 200000, - "output": 8000 + "context": 328000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.085, + "output": 0.46 
+ }, "type": "chat" }, { - "id": "perplexity/sonar-reasoning-pro", - "name": "Sonar Reasoning Pro", - "display_name": "Sonar Reasoning Pro", + "id": "meta-llama/llama-3.2-3b-instruct", + "name": "Llama 3.2 3b Instruct", + "display_name": "Llama 3.2 3b Instruct", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 127000, - "output": 8000 + "context": 131072, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-09", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2024-09-25", + "last_updated": "2024-09-25", + "cost": { + "input": 0.0306, + "output": 0.0493 + }, "type": "chat" }, { - "id": "prodia/flux-fast-schnell", - "name": "Flux Schnell", - "display_name": "Flux Schnell", + "id": "featherless-ai/Qwerky-72B", + "name": "Qwerky 72B", + "display_name": "Qwerky 72B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, + "context": 32000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2025-03-20", + "last_updated": "2025-03-20", + "cost": { + "input": 0.5, + "output": 0.5 + }, "type": "chat" }, { - "id": "nvidia/nemotron-3-nano-30b-a3b", - "name": "Nemotron 3 Nano 30B A3B", - "display_name": "Nemotron 3 Nano 30B A3B", + "id": "moonshotai/kimi-k2-instruct-0711", + "name": "Kimi K2 0711", + "display_name": "Kimi K2 0711", "modalities": { "input": [ "text" @@ -160791,30 +165764,27 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": true, - 
"default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-12-15", + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.05, - "output": 0.24 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "Nvidia Nemotron Nano 9B V2", - "display_name": "Nvidia Nemotron Nano 9B V2", + "id": "moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -160824,30 +165794,27 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-18", - "last_updated": "2025-08-18", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.06, - "output": 0.23 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-ultra-550b-a55b", - "name": "Nemotron 3 Ultra", - "display_name": "Nemotron 3 Ultra", + "id": "moonshotai/kimi-k2-thinking-original", + "name": "Kimi K2 Thinking Original", + "display_name": "Kimi K2 Thinking Original", "modalities": { "input": [ "text" @@ -160857,30 +165824,28 @@ ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 256000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { "input": 0.6, - "output": 2.4, - "cache_read": 0.12 + "output": 2.5 }, "type": "chat" }, { - "id": "nvidia/nemotron-nano-12b-v2-vl", - "name": "Nvidia 
Nemotron Nano 12B V2 VL", - "display_name": "Nvidia Nemotron Nano 12B V2 VL", + "id": "moonshotai/kimi-k2.5:thinking", + "name": "Kimi K2.5 Thinking", + "display_name": "Kimi K2.5 Thinking", "modalities": { "input": [ "text", @@ -160891,10 +165856,9 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -160902,19 +165866,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2025-10-28", + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "NVIDIA Nemotron 3 Super 120B A12B", - "display_name": "NVIDIA Nemotron 3 Super 120B A12B", + "id": "moonshotai/kimi-k2-instruct", + "name": "Kimi K2 Instruct", + "display_name": "Kimi K2 Instruct", "modalities": { "input": [ "text" @@ -160925,27 +165888,26 @@ }, "limit": { "context": 256000, - "output": 32000 + "output": 8192 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-11", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.15, - "output": 0.65 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-preview", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", + "id": "moonshotai/kimi-k2-thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -160955,157 +165917,181 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 256000, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true 
+ }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-01-01", - "last_updated": "2025-01", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.25, - "output": 1 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "arcee-ai/trinity-mini", - "name": "Trinity Mini", - "display_name": "Trinity Mini", + "id": "moonshotai/kimi-k2.6:thinking", + "name": "Kimi K2.6 Thinking", + "display_name": "Kimi K2.6 Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-01", - "last_updated": "2025-12", + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 0.045, - "output": 0.15 + "input": 0.53, + "output": 2.73 }, "type": "chat" }, { - "id": "arcee-ai/trinity-large-thinking", - "name": "Trinity Large Thinking", - "display_name": "Trinity Large Thinking", + "id": "moonshotai/kimi-k2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262100, - "output": 80000 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-04-01", - "last_updated": "2026-04-03", + "extra_capabilities": { + 
"reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-01-26", + "last_updated": "2026-01-26", "cost": { - "input": 0.25, - "output": 0.8999999999999999 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "meta/llama-3.1-8b", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-04-16", + "last_updated": "2026-04-21", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.53, + "output": 2.73 }, "type": "chat" }, { - "id": "meta/llama-3.1-70b", - "name": "Llama 3.1 70B Instruct", - "display_name": "Llama 3.1 70B Instruct", + "id": "moonshotai/kimi-latest", + "name": "Kimi Latest", + "display_name": "Kimi Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": 
{ - "input": 0.72, - "output": 0.72 + "input": 0.5, + "output": 2.6, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "meta/llama-3.2-3b", - "name": "Llama 3.2 3B Instruct", - "display_name": "Llama 3.2 3B Instruct", + "id": "moonshotai/kimi-k2-thinking-turbo-original", + "name": "Kimi K2 Thinking Turbo Original", + "display_name": "Kimi K2 Thinking Turbo Original", "modalities": { "input": [ "text" @@ -161115,29 +166101,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "release_date": "2025-11-06", + "last_updated": "2025-11-06", "cost": { - "input": 0.15, - "output": 0.15 + "input": 1.15, + "output": 8 }, "type": "chat" }, { - "id": "meta/llama-3.2-90b", - "name": "Llama 3.2 90B Vision Instruct", - "display_name": "Llama 3.2 90B Vision Instruct", + "id": "baidu/ernie-4.5-vl-28b-a3b", + "name": "ERNIE 4.5 VL 28B", + "display_name": "ERNIE 4.5 VL 28B", "modalities": { "input": [ "text", @@ -161148,62 +166133,60 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2025-06-30", + "last_updated": "2025-06-30", "cost": { - "input": 0.72, - "output": 0.72 + "input": 0.13999999999999999, + "output": 0.5599999999999999 }, "type": "chat" }, { - "id": "meta/llama-3.2-11b", - "name": "Llama 3.2 11B Vision Instruct", - "display_name": "Llama 3.2 11B Vision Instruct", + "id": "perceptron/perceptron-mk1", + "name": "Perceptron Mk1", + "display_name": "Perceptron Mk1", 
"modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, + "context": 32768, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-25", - "last_updated": "2024-09-25", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "meta/llama-3.2-1b", - "name": "Llama 3.2 1B Instruct", - "display_name": "Llama 3.2 1B Instruct", + "id": "failspy/Meta-Llama-3-70B-Instruct-abliterated-v3.5", + "name": "Llama 3 70B abliterated", + "display_name": "Llama 3 70B abliterated", "modalities": { "input": [ "text" @@ -161213,29 +166196,27 @@ ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2024-09-18", - "last_updated": "2024-09-18", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "meta/llama-3.3-70b", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "nanogpt/coding-router:max", + "name": "Coding Router Max", + "display_name": "Coding Router Max", "modalities": { "input": [ "text" @@ -161245,130 +166226,125 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": 
"2024-12-06", + "attachment": false, + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0, - "output": 0 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "meta/llama-4-scout", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "nanogpt/coding-router:high", + "name": "Coding Router High", + "display_name": "Coding Router High", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0, - "output": 0 + "input": 1.1, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "meta/llama-4-maverick", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "nanogpt/coding-router:low", + "name": "Coding Router Low", + "display_name": "Coding Router Low", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "attachment": false, + "open_weights": false, + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0, - "output": 0 + "input": 0.14, + 
"output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "stepfun/step-3.7-flash", - "name": "Step 3.7 Flash", - "display_name": "Step 3.7 Flash", + "id": "nanogpt/coding-router:medium", + "name": "Coding Router Medium", + "display_name": "Coding Router Medium", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-01", - "release_date": "2026-05-28", - "last_updated": "2026-05-29", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0.2, - "output": 1.15, - "cache_read": 0.04 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "stepfun/step-3.5-flash", - "name": "StepFun 3.5 Flash", - "display_name": "StepFun 3.5 Flash", + "id": "nanogpt/coding-router", + "name": "Coding Router", + "display_name": "Coding Router", "modalities": { "input": [ "text" @@ -161378,10 +166354,9 @@ ] }, "limit": { - "context": 262114, - "output": 262114 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -161389,55 +166364,49 @@ }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-01-29", - "last_updated": "2026-02-13", + "release_date": "2026-05-12", + "last_updated": "2026-05-12", "cost": { - "input": 0.09, - "output": 0.3, - "cache_write": 0.02 + "input": 1.1, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "amazon/nova-2-lite", - "name": "Nova 2 Lite", - "display_name": "Nova 2 Lite", + "id": "GalrionSoftworks/MN-LooseCannon-12B-v1", + "name": "MN-LooseCannon-12B-v1", + "display_name": "MN-LooseCannon-12B-v1", "modalities": { "input": [ - "text", - "image" + "text" 
], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 16384, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "amazon/titan-embed-text-v2", - "name": "Titan Text Embeddings V2", - "display_name": "Titan Text Embeddings V2", + "id": "TheDrummer/Cydonia-24B-v4.3", + "name": "The Drummer Cydonia 24B v4.3", + "display_name": "The Drummer Cydonia 24B v4.3", "modalities": { "input": [ "text" @@ -161447,24 +166416,27 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 32768, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-04-01", - "last_updated": "2024-04", + "release_date": "2025-12-25", + "last_updated": "2025-12-25", + "cost": { + "input": 0.1003, + "output": 0.1207 + }, "type": "chat" }, { - "id": "amazon/nova-micro", - "name": "Nova Micro", - "display_name": "Nova Micro", + "id": "TheDrummer/Cydonia-24B-v4.1", + "name": "The Drummer Cydonia 24B v4.1", + "display_name": "The Drummer Cydonia 24B v4.1", "modalities": { "input": [ "text" @@ -161474,144 +166446,121 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 16384, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-08-19", + 
"last_updated": "2025-08-19", "cost": { - "input": 0.035, - "output": 0.14, - "cache_read": 0.00875 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "amazon/nova-pro", - "name": "Nova Pro", - "display_name": "Nova Pro", + "id": "TheDrummer/Cydonia-24B-v2", + "name": "The Drummer Cydonia 24B v2", + "display_name": "The Drummer Cydonia 24B v2", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 16384, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", "cost": { - "input": 0.8, - "output": 3.2, - "cache_read": 0.2 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "amazon/nova-lite", - "name": "Nova Lite", - "display_name": "Nova Lite", + "id": "TheDrummer/Anubis-70B-v1.1", + "name": "Anubis 70B v1.1", + "display_name": "Anubis 70B v1.1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 300000, - "output": 8192 + "context": 131072, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-03", - "last_updated": "2024-12-03", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.015 + "input": 0.31, + "output": 0.31 }, "type": "chat" }, { - "id": "zai/glm-4.7-flashx", - "name": "GLM 4.7 FlashX", - "display_name": "GLM 4.7 FlashX", + "id": "TheDrummer/UnslopNemo-12B-v4.1", + "name": "UnslopNemo 12b v4", + 
"display_name": "UnslopNemo 12b v4", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-01", - "last_updated": "2026-01-19", + "attachment": true, + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.06, - "output": 0.4, - "cache_read": 0.01 + "input": 0.493, + "output": 0.493 }, "type": "chat" }, { - "id": "zai/glm-4.6v-flash", - "name": "GLM-4.6V-Flash", - "display_name": "GLM-4.6V-Flash", + "id": "TheDrummer/skyfall-36b-v2", + "name": "TheDrummer Skyfall 36B V2", + "display_name": "TheDrummer Skyfall 36B V2", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -161619,26 +166568,27 @@ ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 64000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", + "cost": { + "input": 0.493, + "output": 0.493 + }, "type": "chat" }, { - "id": "zai/glm-4.6", - "name": "GLM 4.6", - "display_name": "GLM 4.6", + "id": "TheDrummer/Rocinante-12B-v1.1", + "name": "Rocinante 12b", + "display_name": "Rocinante 12b", "modalities": { "input": [ "text" @@ -161648,37 +166598,27 @@ ] }, "limit": { - "context": 200000, - "output": 96000 + "context": 16384, + "output": 8192 }, - "temperature": true, - 
"tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.408, + "output": 0.595 }, "type": "chat" }, { - "id": "zai/glm-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "TheDrummer/Magidonia-24B-v4.3", + "name": "The Drummer Magidonia 24B v4.3", + "display_name": "The Drummer Magidonia 24B v4.3", "modalities": { "input": [ "text" @@ -161688,81 +166628,60 @@ ] }, "limit": { - "context": 131000, - "output": 40000 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-12-25", + "last_updated": "2025-12-25", "cost": { - "input": 2.25, - "output": 2.75, - "cache_read": 2.25 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "zai/glm-4.5v", - "name": "GLM 4.5V", - "display_name": "GLM 4.5V", + "id": "TheDrummer/Cydonia-24B-v4", + "name": "The Drummer Cydonia 24B v4", + "display_name": "The Drummer Cydonia 24B v4", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 66000, - "output": 16000 + "context": 16384, + "output": 32768 }, - "temperature": true, - "tool_call": 
true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "attachment": false, + "open_weights": false, + "release_date": "2025-07-22", + "last_updated": "2025-07-22", "cost": { - "input": 0.6, - "output": 1.8, - "cache_read": 0.11 + "input": 0.2006, + "output": 0.2414 }, "type": "chat" }, { - "id": "zai/glm-4.6v", - "name": "GLM-4.6V", - "display_name": "GLM-4.6V", + "id": "TheDrummer/Skyfall-31B-v4.2", + "name": "TheDrummer Skyfall 31B v4.2", + "display_name": "TheDrummer Skyfall 31B v4.2", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -161770,31 +166689,27 @@ ] }, "limit": { - "context": 128000, - "output": 24000 + "context": 131072, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-30", - "last_updated": "2025-12-08", + "release_date": "2026-03-26", + "last_updated": "2026-03-26", "cost": { - "input": 0.3, - "output": 0.9, - "cache_read": 0.05 + "input": 0.55, + "output": 0.8 }, "type": "chat" }, { - "id": "zai/glm-4.7-flash", - "name": "GLM 4.7 Flash", - "display_name": "GLM 4.7 Flash", + "id": "TheDrummer/Anubis-70B-v1", + "name": "Anubis 70B v1", + "display_name": "Anubis 70B v1", "modalities": { "input": [ "text" @@ -161804,70 +166719,57 @@ ] }, "limit": { - "context": 200000, - "output": 131000 + "context": 65536, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": 
"2026-03-13", - "last_updated": "2026-01-19", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.07, - "output": 0.4 + "input": 0.31, + "output": 0.31 }, "type": "chat" }, { - "id": "zai/glm-5v-turbo", - "name": "GLM 5V Turbo", - "display_name": "GLM 5V Turbo", + "id": "huihui-ai/Qwen2.5-32B-Instruct-abliterated", + "name": "Qwen 2.5 32B Abliterated", + "display_name": "Qwen 2.5 32B Abliterated", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-01", - "last_updated": "2026-04-01", + "release_date": "2025-01-06", + "last_updated": "2025-01-06", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "zai/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "huihui-ai/Llama-3.3-70B-Instruct-abliterated", + "name": "Llama 3.3 70B Instruct abliterated", + "display_name": "Llama 3.3 70B Instruct abliterated", "modalities": { "input": [ "text" @@ -161877,41 +166779,27 @@ ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": 
{ - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "zai/glm-5-turbo", - "name": "GLM 5 Turbo", - "display_name": "GLM 5 Turbo", + "id": "huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated", + "name": "DeepSeek R1 Qwen Abliterated", + "display_name": "DeepSeek R1 Qwen Abliterated", "modalities": { "input": [ "text" @@ -161921,35 +166809,28 @@ ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-16", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 1.4, + "output": 1.4 }, "type": "chat" }, { - "id": "zai/glm-4.5", - "name": "GLM 4.5", - "display_name": "GLM 4.5", + "id": "huihui-ai/DeepSeek-R1-Distill-Llama-70B-abliterated", + "name": "DeepSeek R1 Llama 70B Abliterated", + "display_name": "DeepSeek R1 Llama 70B Abliterated", "modalities": { "input": [ "text" @@ -161959,37 +166840,28 @@ ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.11 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "zai/glm-4.5-air", - "name": "GLM 4.5 Air", - 
"display_name": "GLM 4.5 Air", + "id": "Envoid/Llama-3.05-NT-Storybreaker-Ministral-70B", + "name": "Llama 3.05 Storybreaker Ministral 70b", + "display_name": "Llama 3.05 Storybreaker Ministral 70b", "modalities": { "input": [ "text" @@ -161999,71 +166871,57 @@ ] }, "limit": { - "context": 128000, - "output": 96000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.03 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "zai/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "Envoid/Llama-3.05-Nemotron-Tenyxchat-Storybreaker-70B", + "name": "Nemotron Tenyxchat Storybreaker 70b", + "display_name": "Nemotron Tenyxchat Storybreaker 70b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 64000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-07", - "last_updated": "2026-03-27", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "meituan/longcat-flash-thinking-2601", - "name": "LongCat Flash Thinking 2601", - "display_name": "LongCat Flash Thinking 
2601", + "id": "stepfun-ai/step-3.5-flash-2603", + "name": "Step 3.5 Flash 2603", + "display_name": "Step 3.5 Flash 2603", "modalities": { "input": [ "text" @@ -162073,10 +166931,9 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 256000, + "output": 256000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, @@ -162084,14 +166941,18 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-03-13", - "last_updated": "2026-03-13", + "release_date": "2026-04-14", + "last_updated": "2026-04-14", + "cost": { + "input": 0.1, + "output": 0.3 + }, "type": "chat" }, { - "id": "meituan/longcat-flash-chat", - "name": "LongCat Flash Chat", - "display_name": "LongCat Flash Chat", + "id": "stepfun-ai/step-3.5-flash", + "name": "Step 3.5 Flash", + "display_name": "Step 3.5 Flash", "modalities": { "input": [ "text" @@ -162101,79 +166962,92 @@ ] }, "limit": { - "context": 128000, - "output": 100000 + "context": 256000, + "output": 256000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-30", - "last_updated": "2025-08-30", + "release_date": "2026-02-02", + "last_updated": "2026-02-02", + "cost": { + "input": 0.2, + "output": 0.5 + }, "type": "chat" }, { - "id": "voyage/voyage-code-2", - "name": "voyage-code-2", - "display_name": "voyage-code-2", + "id": "mistral/mistral-medium-3.5", + "name": "Mistral Medium 3.5", + "display_name": "Mistral Medium 3.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": 
false, - "release_date": "2024-01-01", - "last_updated": "2024-01", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 1.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "voyage/voyage-code-3", - "name": "voyage-code-3", - "display_name": "voyage-code-3", + "id": "mistral/mistral-medium-3.5:thinking", + "name": "Mistral Medium 3.5 Thinking", + "display_name": "Mistral Medium 3.5 Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-01", - "last_updated": "2024-09", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", + "cost": { + "input": 1.5, + "output": 7.5 + }, "type": "chat" }, { - "id": "voyage/rerank-2.5-lite", - "name": "Voyage Rerank 2.5 Lite", - "display_name": "Voyage Rerank 2.5 Lite", + "id": "Tongyi-Zhiwen/QwenLong-L1-32B", + "name": "QwenLong L1 32B", + "display_name": "QwenLong L1 32B", "modalities": { "input": [ "text" @@ -162183,24 +167057,27 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 40960 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", + "cost": { + "input": 0.13999999999999999, + "output": 0.6 + }, "type": "chat" }, { - "id": "voyage/voyage-finance-2", - "name": "voyage-finance-2", - "display_name": "voyage-finance-2", + "id": "google/gemini-flash-1.5", + "name": "Gemini 1.5 Flash", + "display_name": "Gemini 1.5 Flash", "modalities": { "input": [ "text" @@ -162210,440 +167087,630 @@ ] 
}, "limit": { - "context": 8192, - "output": 1536 + "context": 2000000, + "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03", + "release_date": "2024-05-14", + "last_updated": "2024-05-14", + "cost": { + "input": 0.0748, + "output": 0.306 + }, "type": "chat" }, { - "id": "voyage/voyage-3.5", - "name": "voyage-3.5", - "display_name": "voyage-3.5", + "id": "google/gemini-3.1-pro-preview-high", + "name": "Gemini 3.1 Pro (Preview High)", + "display_name": "Gemini 3.1 Pro (Preview High)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2026-02-21", + "last_updated": "2026-02-21", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "voyage/voyage-4-large", - "name": "voyage-4-large", - "display_name": "voyage-4-large", + "id": "google/gemini-3.1-flash-lite", + "name": "Gemini 3.1 Flash Lite", + "display_name": "Gemini 3.1 Flash Lite", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - 
"supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "release_date": "2026-03-03", + "last_updated": "2026-03-03", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "voyage/voyage-3.5-lite", - "name": "voyage-3.5-lite", - "display_name": "voyage-3.5-lite", + "id": "google/gemini-3-flash-preview-thinking", + "name": "Gemini 3 Flash Thinking", + "display_name": "Gemini 3 Flash Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", + "cost": { + "input": 0.5, + "output": 3 + }, "type": "chat" }, { - "id": "voyage/rerank-2.5", - "name": "Voyage Rerank 2.5", - "display_name": "Voyage Rerank 2.5", + "id": "google/gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "audio" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 1048576, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": 
false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2025-08-11", - "last_updated": "2025-08-11", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", + "cost": { + "input": 1.5, + "output": 9, + "cache_read": 0.15 + }, "type": "chat" }, { - "id": "voyage/voyage-4", - "name": "voyage-4", - "display_name": "voyage-4", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 262144, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.1, + "output": 0.35 + }, "type": "chat" }, { - "id": "voyage/voyage-3-large", - "name": "voyage-3-large", - "display_name": "voyage-3-large", + "id": "google/gemini-pro-latest", + "name": "Gemini Pro Latest", + "display_name": "Gemini Pro Latest", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-09-01", - 
"last_updated": "2024-09", + "release_date": "2026-03-29", + "last_updated": "2026-03-29", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "voyage/voyage-law-2", - "name": "voyage-law-2", - "display_name": "voyage-law-2", + "id": "google/gemini-3.1-pro-preview-customtools", + "name": "Gemini 3.1 Pro (Preview Custom Tools)", + "display_name": "Gemini 3.1 Pro (Preview Custom Tools)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03", + "release_date": "2026-02-27", + "last_updated": "2026-02-27", + "cost": { + "input": 2, + "output": 12, + "cache_read": 0.2 + }, "type": "chat" }, { - "id": "voyage/voyage-4-lite", - "name": "voyage-4-lite", - "display_name": "voyage-4-lite", + "id": "google/gemini-flash-lite-latest", + "name": "Gemini Flash Lite Latest", + "display_name": "Gemini Flash Lite Latest", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 1048576, + "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-06", - "last_updated": "2026-03-06", + 
"release_date": "2026-03-29", + "last_updated": "2026-03-29", + "cost": { + "input": 0.25, + "output": 1.5, + "cache_read": 0.025 + }, "type": "chat" }, { - "id": "morph/morph-v3-large", - "name": "Morph v3 Large", - "display_name": "Morph v3 Large", + "id": "google/gemma-4-26b-a4b-it:thinking", + "name": "Gemma 4 26B A4B Thinking", + "display_name": "Gemma 4 26B A4B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 262144, + "output": 131072 }, - "temperature": false, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.9, - "output": 1.9 + "input": 0.13, + "output": 0.4 }, "type": "chat" }, { - "id": "morph/morph-v3-fast", - "name": "Morph v3 Fast", - "display_name": "Morph v3 Fast", + "id": "google/gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro (Preview)", + "display_name": "Gemini 3.1 Pro (Preview)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 16000, - "output": 16000 + "context": 1048756, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-08-15", - "last_updated": "2024-08-15", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - 
"input": 0.8, - "output": 1.2 + "input": 2, + "output": 12, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/veo-3.1-fast-generate-001", - "name": "Veo 3.1 Fast Generate", - "display_name": "Veo 3.1 Fast Generate", + "id": "google/gemma-4-26b-a4b-it", + "name": "Gemma 4 26B A4B", + "display_name": "Gemma 4 26B A4B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.13, + "output": 0.4 + }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-image", - "name": "Nano Banana (Gemini 2.5 Flash Image)", - "display_name": "Nano Banana (Gemini 2.5 Flash Image)", + "id": "google/gemini-3.1-pro-preview-low", + "name": "Gemini 3.1 Pro (Preview Low)", + "display_name": "Gemini 3.1 Pro (Preview Low)", "modalities": { "input": [ - "text" - ], - "output": [ "text", "image" + ], + "output": [ + "text" ] }, "limit": { - "context": 32768, + "context": 1048756, "output": 65536 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-08-26", + "release_date": "2026-02-21", + "last_updated": 
"2026-02-21", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.03 + "input": 2, + "output": 12, + "cache_read": 0.2 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-embedding-2", - "name": "Gemini Embedding 2", - "display_name": "Gemini Embedding 2", + "id": "google/gemma-4-31b-it:thinking", + "name": "Gemma 4 31B Thinking", + "display_name": "Gemma 4 31B Thinking", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-03-10", - "last_updated": "2026-03-23", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", + "cost": { + "input": 0.1, + "output": 0.35 + }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image", - "name": "Gemini 3.1 Flash Image (Nano Banana 2)", - "display_name": "Gemini 3.1 Flash Image (Nano Banana 2)", + "id": "google/gemini-3.5-flash-thinking", + "name": "Gemini 3.5 Flash Thinking", + "display_name": "Gemini 3.5 Flash Thinking", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 1048576, + "output": 65536 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2026-05-19", + "last_updated": 
"2026-05-19", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 1.5, + "output": 9, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "google/gemini-3-flash-preview", + "name": "Gemini 3 Flash (Preview)", + "display_name": "Gemini 3 Flash (Preview)", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65000 + "context": 1048756, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -162651,118 +167718,136 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.03 + "input": 0.5, + "output": 3 }, "type": "chat" }, { - "id": "google/gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "google/gemini-flash-latest", + "name": "Gemini Flash Latest", + "display_name": "Gemini Flash Latest", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1048756, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-03-29", + 
"last_updated": "2026-03-29", "cost": { - "input": 0.14, - "output": 0.4 + "input": 1.5, + "output": 9, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "google/imagen-4.0-generate-001", - "name": "Imagen 4", - "display_name": "Imagen 4", + "id": "liquid/lfm-2-24b-a2b", + "name": "LFM2 24B A2B", + "display_name": "LFM2 24B A2B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "type": "imageGeneration" + "release_date": "2025-12-20", + "last_updated": "2025-12-20", + "cost": { + "input": 0.03, + "output": 0.12 + }, + "type": "chat" }, { - "id": "google/text-embedding-005", - "name": "Text Embedding 005", - "display_name": "Text Embedding 005", + "id": "x-ai/grok-4.20", + "name": "Grok 4.20", + "display_name": "Grok 4.20", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 2000000, + "output": 131072 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-08-01", - "last_updated": "2024-08", + "release_date": "2026-03-31", + "last_updated": "2026-03-31", + "cost": { + "input": 2, + "output": 6 + }, "type": "chat" }, { - "id": "google/gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "x-ai/grok-4.3", + "name": "Grok 4.3", + "display_name": "Grok 4.3", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -162770,107 +167855,69 @@ }, "limit": { "context": 1000000, - "output": 65000 + "output": 1000000 }, - "temperature": true, 
"tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-04-30", + "last_updated": "2026-04-30", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "x-ai/grok-4.20-multi-agent", + "name": "Grok 4.20 Multi-Agent", + "display_name": "Grok 4.20 Multi-Agent", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 2000000, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2026-02-19", + "release_date": "2026-03-31", + "last_updated": "2026-03-31", "cost": { "input": 2, - "output": 12, - "cache_read": 0.2 + "output": 6 }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", 
- "display_name": "Gemini 3.1 Flash Lite", + "id": "x-ai/grok-latest", + "name": "Grok Latest", + "display_name": "Grok Latest", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -162878,357 +167925,277 @@ }, "limit": { "context": 1000000, - "output": 65000 + "output": 1000000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.03 + "input": 1.25, + "output": 2.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "google/gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "x-ai/grok-build-0.1", + "name": "Grok Build 0.1", + "display_name": "Grok Build 0.1", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 256000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2026-05-20", + "last_updated": "2026-05-20", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01 + "input": 1, + "output": 2, + "cache_read": 0.2 }, "type": "chat" }, { 
- "id": "google/veo-3.1-generate-001", - "name": "Veo 3.1", - "display_name": "Veo 3.1", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.0", + "name": "EVA Llama 3.33 70B", + "display_name": "EVA Llama 3.33 70B", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 16384, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", + "cost": { + "input": 2.006, + "output": 2.006 + }, "type": "chat" }, { - "id": "google/gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "EVA-UNIT-01/EVA-Qwen2.5-72B-v0.2", + "name": "EVA-Qwen2.5-72B-v0.2", + "display_name": "EVA-Qwen2.5-72B-v0.2", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.015 + "input": 0.7989999999999999, + "output": 0.7989999999999999 }, "type": "chat" }, { - "id": "google/gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "EVA-UNIT-01/EVA-LLaMA-3.33-70B-v0.1", + "name": "EVA-LLaMA-3.33-70B-v0.1", + "display_name": "EVA-LLaMA-3.33-70B-v0.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16384, + 
"output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15 + "input": 2.006, + "output": 2.006 }, "type": "chat" }, { - "id": "google/veo-3.0-generate-001", - "name": "Veo 3.0", - "display_name": "Veo 3.0", + "id": "EVA-UNIT-01/EVA-Qwen2.5-32B-v0.2", + "name": "EVA-Qwen2.5-32B-v0.2", + "display_name": "EVA-Qwen2.5-32B-v0.2", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 16384, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", + "cost": { + "input": 0.7989999999999999, + "output": 0.7989999999999999 + }, "type": "chat" }, { - "id": "google/imagen-4.0-ultra-generate-001", - "name": "Imagen 4 Ultra", - "display_name": "Imagen 4 Ultra", + "id": "microsoft/wizardlm-2-8x22b", + "name": "WizardLM-2 8x22B", + "display_name": "WizardLM-2 8x22B", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, + "context": 65536, "output": 8192 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + 
"attachment": true, "open_weights": false, - "release_date": "2025-05-24", - "last_updated": "2025-05-24", - "type": "imageGeneration" + "release_date": "2025-04-15", + "last_updated": "2025-04-15", + "cost": { + "input": 0.49299999999999994, + "output": 0.49299999999999994 + }, + "type": "chat" }, { - "id": "google/gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "Doctor-Shotgun/MS3.2-24B-Magnum-Diamond", + "name": "MS3.2 24B Magnum Diamond", + "display_name": "MS3.2 24B Magnum Diamond", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16384, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "google/veo-3.0-fast-generate-001", - "name": "Veo 3.0 Fast Generate", - "display_name": "Veo 3.0 Fast Generate", + "id": "poolside/laguna-xs.2", + "name": "Laguna XS.2", + "display_name": "Laguna XS.2", "modalities": { "input": [ "text" ], "output": [ - 
"video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-06-08", - "last_updated": "2026-06-08", + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 0.1, + "output": 0.3 + }, "type": "chat" }, { - "id": "google/gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "poolside/laguna-m.1", + "name": "Laguna M.1", + "display_name": "Laguna M.1", "modalities": { "input": [ "text" @@ -163238,147 +168205,135 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", - "type": "embedding" + "release_date": "2026-04-29", + "last_updated": "2026-04-29", + "cost": { + "input": 0.1, + "output": 0.3 + }, + "type": "chat" }, { - "id": "google/gemini-3-pro-image", - "name": "Nano Banana Pro (Gemini 3 Pro Image)", - "display_name": "Nano Banana Pro (Gemini 3 Pro Image)", + "id": "z-ai/glm-4.5v:thinking", + "name": "GLM 4.5V Thinking", + "display_name": "GLM 4.5V Thinking", "modalities": { "input": [ - "text" - ], - "output": [ "text", "image" + ], + "output": [ + "text" ] }, "limit": { - "context": 65536, - "output": 32768 + "context": 64000, + "output": 96000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": 
false, + "attachment": true, "open_weights": false, - "knowledge": "2025-03", - "release_date": "2025-09-01", - "last_updated": "2025-09", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2 + "input": 0.6, + "output": 1.7999999999999998 }, "type": "chat" }, { - "id": "google/imagen-4.0-fast-generate-001", - "name": "Imagen 4 Fast", - "display_name": "Imagen 4 Fast", + "id": "z-ai/glm-4.6:thinking", + "name": "GLM 4.6 Thinking", + "display_name": "GLM 4.6 Thinking", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 480, - "output": 8192 + "context": 200000, + "output": 65535 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06", - "type": "imageGeneration" + "release_date": "2025-09-29", + "last_updated": "2025-09-29", + "cost": { + "input": 0.4, + "output": 1.5 + }, + "type": "chat" }, { - "id": "google/text-multilingual-embedding-002", - "name": "Text Multilingual Embedding 002", - "display_name": "Text Multilingual Embedding 002", + "id": "z-ai/glm-4.5v", + "name": "GLM 4.5V", + "display_name": "GLM 4.5V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 64000, + "output": 96000 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03", + "release_date": "2025-11-22", + "last_updated": "2025-11-22", + "cost": { + "input": 0.6, + "output": 1.7999999999999998 + }, "type": "chat" }, { - "id": "google/gemini-3.1-flash-image-preview", - "name": "Gemini 3.1 Flash Image 
Preview (Nano Banana 2)", - "display_name": "Gemini 3.1 Flash Image Preview (Nano Banana 2)", + "id": "z-ai/glm-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 200000, + "output": 65535 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -163388,309 +168343,221 @@ "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 0.4, + "output": 1.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "google/gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "z-ai/glm-5v-turbo:thinking", + "name": "GLM 5V Turbo Thinking", + "display_name": "GLM 5V Turbo Thinking", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202800, + "output": 131100 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.3, - "output": 2.5, - 
"cache_read": 0.03, - "input_audio": 1 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "google/gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "z-ai/glm-5v-turbo", + "name": "GLM 5V Turbo", + "display_name": "GLM 5V Turbo", "modalities": { "input": [ "text", - "image", - "audio", - "video", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202800, + "output": 131100 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 - } + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "openai/gpt-5-pro", - "name": "GPT-5 pro", - "display_name": "GPT-5 pro", + "id": "z-ai/glm-5-turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 202800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, 
"extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-10-06", + "release_date": "2026-03-15", + "last_updated": "2026-03-15", "cost": { - "input": 15, - "output": 120 + "input": 1.2, + "output": 4, + "cache_read": 0.24 }, "type": "chat" }, { - "id": "openai/gpt-image-1", - "name": "GPT Image 1", - "display_name": "GPT Image 1", + "id": "openai/o3-mini-low", + "name": "OpenAI o3-mini (Low)", + "display_name": "OpenAI o3-mini (Low)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-03-25", - "last_updated": "2025-03-25", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 5, - "output": 40, - "cache_read": 1.25 + "input": 9.996, + "output": 19.992 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5-chat", - "name": "GPT-5 Chat", - "display_name": "GPT-5 Chat", + "id": "openai/gpt-oss-safeguard-20b", + "name": "GPT OSS Safeguard 20B", + "display_name": "GPT OSS Safeguard 20B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { "context": 128000, 
"output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-10-29", + "last_updated": "2025-10-29", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.075, + "output": 0.3 }, "type": "chat" }, { - "id": "openai/gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "openai/o3", + "name": "OpenAI o3", + "display_name": "OpenAI o3", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -163698,22 +168565,20 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2, + "output": 8 }, "type": "chat" }, { - "id": "openai/text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "openai/o4-mini-high", + "name": "OpenAI o4-mini high", + "display_name": "OpenAI o4-mini high", "modalities": { "input": [ "text" @@ -163723,56 +168588,87 @@ ] }, "limit": { - "context": 8192, 
- "output": 1536 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "type": "embedding" + "release_date": "2025-04-16", + "last_updated": "2025-04-16", + "cost": { + "input": 1.1, + "output": 4.4 + }, + "type": "chat" }, { - "id": "openai/gpt-image-1-mini", - "name": "GPT Image 1 Mini", - "display_name": "GPT Image 1 Mini", + "id": "openai/o3-pro-2025-06-10", + "name": "OpenAI o3-pro (2025-06-10)", + "display_name": "OpenAI o3-pro (2025-06-10)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2025-06-10", + "last_updated": "2025-06-10", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.2 + "input": 9.996, + "output": 19.992 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.4-pro", - "name": "GPT 5.4 Pro", - "display_name": "GPT 5.4 Pro", + "id": "openai/gpt-5.2-pro", + "name": "GPT 5.2 Pro", + "display_name": "GPT 5.2 Pro", "modalities": { "input": [ "text", @@ -163784,10 
+168680,9 @@ ] }, "limit": { - "context": 1050000, + "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -163815,19 +168710,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - "input": 30, - "output": 180 + "input": 21, + "output": 168 }, "type": "chat" }, { - "id": "openai/text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "openai/gpt-4o-mini-search-preview", + "name": "GPT-4o mini Search Preview", + "display_name": "GPT-4o mini Search Preview", "modalities": { "input": [ "text" @@ -163837,24 +168731,27 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-01-25", - "last_updated": "2024-01-25", - "type": "embedding" + "release_date": "2024-07-18", + "last_updated": "2024-07-18", + "cost": { + "input": 0.088, + "output": 0.35 + }, + "type": "chat" }, { - "id": "openai/gpt-5.2-pro", - "name": "GPT 5.2 ", - "display_name": "GPT 5.2 ", + "id": "openai/gpt-5", + "name": "GPT 5", + "display_name": "GPT 5", "modalities": { "input": [ "text", @@ -163869,7 +168766,6 @@ "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -163880,11 +168776,12 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "high", + "effort": "medium", "effort_options": [ + "minimal", + "low", "medium", - "high", - "xhigh" + "high" ], "verbosity": "medium", "verbosity_options": [ @@ -163897,35 +168794,62 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-11", - "last_updated": 
"2025-12-11", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 21, - "output": 168 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "openai/o3-pro", - "name": "o3 Pro", - "display_name": "o3 Pro", + "id": "openai/gpt-3.5-turbo", + "name": "GPT-3.5 Turbo", + "display_name": "GPT-3.5 Turbo", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16385, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2022-11-30", + "last_updated": "2024-01-01", + "cost": { + "input": 0.5, + "output": 1.5 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-pro", + "name": "GPT 5 Pro", + "display_name": "GPT 5 Pro", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -163934,9 +168858,10 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ + "mode": "fixed", + "effort": "high", + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -163946,22 +168871,22 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-04-16", - "last_updated": "2025-06-10", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 20, - "output": 80 + "input": 15, + "output": 120 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini-search-preview", - "name": "GPT 4o Mini Search Preview", - "display_name": "GPT 4o Mini Search Preview", + "id": "openai/gpt-4o", + "name": "GPT-4o", + "display_name": "GPT-4o", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -163971,61 
+168896,48 @@ "context": 128000, "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-12", - "last_updated": "2025-01", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "openai/gpt-5.4", - "name": "GPT 5.4", - "display_name": "GPT 5.4", + "id": "openai/o4-mini", + "name": "OpenAI o4-mini", + "display_name": "OpenAI o4-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -164033,22 +168945,20 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "openai/gpt-5.5", - "name": "GPT 5.5", - "display_name": "GPT 5.5", + "id": "openai/gpt-5.4-nano", + "name": "GPT 5.4 Nano", + "display_name": "GPT 5.4 Nano", "modalities": { "input": [ "text", @@ -164060,22 +168970,22 @@ ] }, "limit": { - "context": 1000000, + "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, 
"reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", "low", "medium", "high", @@ -164092,64 +169002,23 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-23", - "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5 - }, - "type": "chat" - }, - { - "id": "openai/gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 131000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.35, - "output": 0.75, - "cache_read": 0.25 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-max", - "name": "GPT 5.1 Codex Max", - "display_name": "GPT 5.1 Codex Max", + "id": "openai/gpt-5.1-codex", + "name": "GPT 5.1 Codex", + "display_name": "GPT 5.1 Codex", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -164159,8 +169028,7 @@ "context": 400000, "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": false @@ -164188,20 +169056,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-19", + "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { "input": 1.25, - 
"output": 10, - "cache_read": 0.125 + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "openai/gpt-5.1-codex-max", + "name": "GPT 5.1 Codex Max", + "display_name": "GPT 5.1 Codex Max", "modalities": { "input": [ "text", @@ -164216,7 +169082,6 @@ "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164245,47 +169110,49 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-12", + "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 2.5, + "output": 20 }, "type": "chat" }, { - "id": "openai/text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "openai/gpt-4o-2024-08-06", + "name": "GPT-4o (2024-08-06)", + "display_name": "GPT-4o (2024-08-06)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2022-12-15", - "last_updated": "2022-12-15", - "type": "embedding" + "release_date": "2024-08-06", + "last_updated": "2024-08-06", + "cost": { + "input": 2.499, + "output": 9.996 + }, + "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "GPT OSS 20B", - "display_name": "GPT OSS 20B", + "id": "openai/o1-preview", + "name": "OpenAI o1-preview", + "display_name": "OpenAI o1-preview", "modalities": { "input": [ "text" @@ -164295,40 +169162,45 @@ ] }, "limit": { - "context": 131072, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, 
"default": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "open_weights": false, + "release_date": "2024-09-12", + "last_updated": "2024-09-12", "cost": { - "input": 0.05, - "output": 0.2 + "input": 14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "openai/o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "openai/o3-mini", + "name": "OpenAI o3-mini", + "display_name": "OpenAI o3-mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" @@ -164338,7 +169210,6 @@ "context": 200000, "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164358,22 +169229,20 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 1.1, + "output": 4.4 }, "type": "chat" }, { - "id": "openai/gpt-5.4-nano", - "name": "GPT 5.4 Nano", - "display_name": "GPT 5.4 Nano", + "id": "openai/gpt-5.2", + "name": "GPT 5.2", + "display_name": "GPT 5.2", "modalities": { "input": [ "text", @@ -164388,7 +169257,6 @@ "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164418,13 +169286,11 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-01-01", + "last_updated": "2026-01-01", "cost": { - 
"input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.75, + "output": 14 }, "type": "chat" }, @@ -164446,7 +169312,6 @@ "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164475,9 +169340,8 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", "release_date": "2026-02-24", - "last_updated": "2026-02-05", + "last_updated": "2026-02-24", "cost": { "input": 1.75, "output": 14, @@ -164486,9 +169350,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.5-pro", - "name": "GPT 5.5 Pro", - "display_name": "GPT 5.5 Pro", + "id": "openai/gpt-latest", + "name": "GPT Latest", + "display_name": "GPT Latest", "modalities": { "input": [ "text", @@ -164503,32 +169367,79 @@ "context": 1000000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-29", + "last_updated": "2026-03-29", + "cost": { + "input": 5, + "output": 30, + "cache_read": 0.5 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5.1-codex-mini", + "name": "GPT 5.1 Codex Mini", + "display_name": "GPT 5.1 Codex Mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": false + }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" } }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-24", - "last_updated": "2026-04-23", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 30, - 
"output": 180 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo", - "name": "GPT-3.5 Turbo", - "display_name": "GPT-3.5 Turbo", + "id": "openai/o4-mini-deep-research", + "name": "OpenAI o4-mini Deep Research", + "display_name": "OpenAI o4-mini Deep Research", "modalities": { "input": [ "text" @@ -164538,29 +169449,42 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": false, "open_weights": false, - "knowledge": "2021-09", - "release_date": "2023-05-28", - "last_updated": "2023-11-06", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 0.5, - "output": 1.5 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "openai/gpt-5.2-chat", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "openai/gpt-4.1-nano", + "name": "GPT 4.1 Nano", + "display_name": "GPT 4.1 Nano", "modalities": { "input": [ "text", @@ -164571,98 +169495,119 @@ "text" ] }, + "limit": { + "context": 1047576, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-14", + "last_updated": "2025-04-14", + "cost": { + "input": 0.1, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, "limit": { "context": 128000, "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, + 
"extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-11", - "last_updated": "2025-08-07", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "openai/gpt-3.5-turbo-instruct", - "name": "GPT-3.5 Turbo Instruct", - "display_name": "GPT-3.5 Turbo Instruct", + "id": "openai/gpt-4o-2024-11-20", + "name": "GPT-4o (2024-11-20)", + "display_name": "GPT-4o (2024-11-20)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2021-09", - "release_date": "2023-09-28", - "last_updated": "2023-03-01", + "release_date": "2024-11-20", + "last_updated": "2024-11-20", "cost": { - "input": 1.5, - "output": 2 + "input": 2.5, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5.1-instant", - "name": "GPT-5.1 Instant", - "display_name": "GPT-5.1 Instant", + "id": "openai/o1", + "name": "OpenAI o1", + "display_name": "OpenAI o1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", 
"high" @@ -164670,22 +169615,20 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-12", - "last_updated": "2025-08-07", + "release_date": "2024-12-17", + "last_updated": "2024-12-17", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 14.993999999999998, + "output": 59.993 }, "type": "chat" }, { - "id": "openai/gpt-5.2-codex", - "name": "GPT-5.2-Codex", - "display_name": "GPT-5.2-Codex", + "id": "openai/o1-pro", + "name": "OpenAI o1 Pro", + "display_name": "OpenAI o1 Pro", "modalities": { "input": [ "text", @@ -164697,11 +169640,10 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 200000, + "output": 100000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -164713,13 +169655,6 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -164729,52 +169664,56 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-12-18", - "last_updated": "2025-12-11", + "release_date": "2025-01-25", + "last_updated": "2025-01-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 150, + "output": 600 }, "type": "chat" }, { - "id": "openai/gpt-image-2", - "name": "GPT Image 2", - "display_name": "GPT Image 2", + "id": "openai/gpt-chat-latest", + "name": "GPT Chat Latest", + "display_name": "GPT Chat Latest", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, + "extra_capabilities": { + 
"reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": { "input": 5, "output": 30, - "cache_read": 1.25 + "cache_read": 0.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.1-codex", - "name": "GPT-5.1-Codex", - "display_name": "GPT-5.1-Codex", + "id": "openai/gpt-5.4", + "name": "GPT 5.4", + "display_name": "GPT 5.4", "modalities": { "input": [ "text", @@ -164786,10 +169725,9 @@ ] }, "limit": { - "context": 400000, + "context": 922000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164805,7 +169743,8 @@ "none", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -164818,47 +169757,12 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-12", - "last_updated": "2025-11-13", - "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 - }, - "type": "chat" - }, - { - "id": "openai/gpt-oss-safeguard-20b", - "name": "gpt-oss-safeguard-20b", - "display_name": "gpt-oss-safeguard-20b", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 65536 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-12-01", - "last_updated": "2024-12-01", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.075, - "output": 0.3, - "cache_read": 0.037 + "input": 2.5, + "output": 15, + "cache_read": 0.25 }, "type": "chat" }, @@ -164880,7 +169784,6 @@ "context": 400000, "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -164910,7 +169813,6 @@ }, 
"attachment": true, "open_weights": false, - "knowledge": "2025-08-31", "release_date": "2026-03-17", "last_updated": "2026-03-17", "cost": { @@ -164921,9 +169823,9 @@ "type": "chat" }, { - "id": "openai/gpt-5.1-thinking", - "name": "GPT 5.1 Thinking", - "display_name": "GPT 5.1 Thinking", + "id": "openai/gpt-4.1", + "name": "GPT 4.1", + "display_name": "GPT 4.1", "modalities": { "input": [ "text", @@ -164931,34 +169833,55 @@ "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1047576, + "output": 32768 }, - "temperature": true, "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-09-10", + "last_updated": "2025-09-10", + "cost": { + "input": 2, + "output": 8 + }, + "type": "chat" + }, + { + "id": "openai/o3-deep-research", + "name": "OpenAI o3 Deep Research", + "display_name": "OpenAI o3 Deep Research", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, + "output": 100000 + }, + "tool_call": false, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, + "default_enabled": true, "mode": "effort", - "effort": "none", + "effort": "medium", "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ "low", "medium", "high" @@ -164966,89 +169889,103 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-11-12", - "last_updated": "2025-08-07", + "release_date": "2025-04-16", + "last_updated": "2025-04-16", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "openai/gpt-image-1.5", - "name": "GPT Image 1.5", - "display_name": "GPT Image 
1.5", + "id": "openai/gpt-4-turbo-preview", + "name": "GPT-4 Turbo Preview", + "display_name": "GPT-4 Turbo Preview", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 4096 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2023-11-06", + "last_updated": "2024-01-01", "cost": { - "input": 5, - "output": 32, - "cache_read": 1.25 + "input": 9.996, + "output": 30.004999999999995 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "openai/gpt-5.3-chat", - "name": "GPT-5.3 Chat", - "display_name": "GPT-5.3 Chat", + "id": "openai/gpt-5-mini", + "name": "GPT 5 Mini", + "display_name": "GPT 5 Mini", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-06", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.25, + "output": 2 }, "type": "chat" }, { - "id": "openai/gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "openai/gpt-4.1-mini", + "name": "GPT 4.1 Mini", + "display_name": "GPT 4.1 Mini", "modalities": { "input": [ 
"text", @@ -165062,43 +169999,69 @@ "context": 1047576, "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "openai/o1", - "name": "o1", - "display_name": "o1", + "id": "openai/gpt-4-turbo", + "name": "GPT-4 Turbo", + "display_name": "GPT-4 Turbo", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 4096 }, - "temperature": false, - "tool_call": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2023-11-06", + "last_updated": "2024-01-01", + "cost": { + "input": 10, + "output": 30 + }, + "type": "chat" + }, + { + "id": "openai/gpt-5-nano", + "name": "GPT 5 Nano", + "display_name": "GPT 5 Nano", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -165110,6 +170073,13 @@ "mode": "effort", "effort": "medium", "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -165119,93 +170089,121 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.05, + "output": 0.4 }, "type": "chat" }, { - "id": "openai/gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 Turbo", + 
"id": "openai/gpt-5.4-pro", + "name": "GPT 5.4 Pro", + "display_name": "GPT 5.4 Pro", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 922000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 10, - "output": 30 + "input": 30, + "output": 180, + "cache_read": 3 }, "type": "chat" }, { - "id": "openai/gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "openai/o3-mini-high", + "name": "OpenAI o3-mini (High)", + "display_name": "OpenAI o3-mini (High)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 100000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2025-01-31", + "last_updated": "2025-01-31", "cost": { - "input": 2, - "output": 8, - "cache_read": 
0.5 + "input": 0.64, + "output": 2.588 }, "type": "chat" }, { - "id": "openai/gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "openai/gpt-4o-search-preview", + "name": "GPT-4o Search Preview", + "display_name": "GPT-4o Search Preview", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -165215,54 +170213,49 @@ "context": 128000, "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2024-05-13", + "last_updated": "2024-05-13", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 1.47, + "output": 5.88 }, "type": "chat" }, { - "id": "openai/gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "openai/gpt-5.1-2025-11-13", + "name": "GPT-5.1 (2025-11-13)", + "display_name": "GPT-5.1 (2025-11-13)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1000000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ - "minimal", + "none", "low", "medium", "high" @@ -165276,22 +170269,51 @@ "visibility": "hidden" } }, + "attachment": false, + "open_weights": false, + "release_date": "2025-11-13", + "last_updated": "2025-11-13", + "cost": { + "input": 1.25, + "output": 10 + }, + "type": "chat" + }, + { + "id": "openai/gpt-4o-mini", + "name": "GPT-4o mini", + "display_name": "GPT-4o mini", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ 
+ "text" + ] + }, + "limit": { + "context": 128000, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.1496, + "output": 0.595 }, "type": "chat" }, { - "id": "openai/o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "openai/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ "text" @@ -165301,60 +170323,46 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.04, + "output": 0.15 }, "type": "chat" }, { - "id": "openai/o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "openai/gpt-5-codex", + "name": "GPT-5 Codex", + "display_name": "GPT-5 Codex", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -165366,6 +170374,13 @@ "mode": "effort", "effort": "medium", 
"effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -165373,22 +170388,20 @@ "visibility": "hidden" } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-09-15", + "last_updated": "2025-09-15", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 9.996, + "output": 19.992 }, "type": "chat" }, { - "id": "openai/gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "openai/gpt-5.2-codex", + "name": "GPT 5.2 Codex", + "display_name": "GPT 5.2 Codex", "modalities": { "input": [ "text", @@ -165399,45 +170412,10 @@ "text" ] }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", - "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 - }, - "type": "chat" - }, - { - "id": "openai/gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, "limit": { "context": 400000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -165450,10 +170428,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -165466,20 +170444,18 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-01-14", + "last_updated": "2026-01-14", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 1.75, + "output": 14 }, 
"type": "chat" }, { - "id": "openai/o3", - "name": "o3", - "display_name": "o3", + "id": "openai/gpt-5.1", + "name": "GPT 5.1", + "display_name": "GPT 5.1", "modalities": { "input": [ "text", @@ -165491,22 +170467,28 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 400000, + "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, + "default_enabled": false, "mode": "effort", - "effort": "medium", + "effort": "none", "effort_options": [ + "none", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ "low", "medium", "high" @@ -165516,34 +170498,32 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2025-11-13", + "last_updated": "2025-11-13", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 1.25, + "output": 10 }, "type": "chat" }, { - "id": "openai/gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "openai/gpt-5.5", + "name": "GPT 5.5", + "display_name": "GPT 5.5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -165556,10 +170536,10 @@ "mode": "effort", "effort": "medium", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh" ], "verbosity": "medium", "verbosity_options": [ @@ -165570,331 +170550,384 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.25, 
- "output": 10, - "cache_read": 0.125 + "input": 5, + "output": 30, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "Gryphe/MythoMax-L2-13b", + "name": "MythoMax 13B", + "display_name": "MythoMax 13B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 4000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-08-06", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.1003, + "output": 0.1003 }, "type": "chat" }, { - "id": "openai/gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "Unbabel/M-Prometheus-14B", + "name": "M-Prometheus 14B", + "display_name": "M-Prometheus 14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 0.25, - 
"output": 2, - "cache_read": 0.025 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "bytedance/seedance-v1.0-pro-fast", - "name": "Seedance v1.0 Pro Fast", - "display_name": "Seedance v1.0 Pro Fast", + "id": "LLM360/K2-Think", + "name": "K2-Think", + "display_name": "K2-Think", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-10-31", - "last_updated": "2025-10-31", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", + "cost": { + "input": 0.17, + "output": 0.68 + }, "type": "chat" }, { - "id": "bytedance/seedance-v1.0-lite-t2v", - "name": "Seedance v1.0 Lite Text-to-Video", - "display_name": "Seedance v1.0 Lite Text-to-Video", + "id": "NousResearch/hermes-4-405b", + "name": "Hermes 4 Large", + "display_name": "Hermes 4 Large", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2025-08-26", + "last_updated": "2025-08-26", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" }, { - "id": "bytedance/seedance-2.0-fast", - "name": "Seedance 2.0 Fast", - "display_name": "Seedance 2.0 Fast", + "id": "NousResearch/hermes-3-llama-3.1-70b", + "name": "Hermes 3 70B", + "display_name": "Hermes 3 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 65536, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, 
"open_weights": false, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "release_date": "2026-01-07", + "last_updated": "2026-01-07", + "cost": { + "input": 0.408, + "output": 0.408 + }, "type": "chat" }, { - "id": "bytedance/seedance-v1.0-lite-i2v", - "name": "Seedance v1.0 Lite Image-to-Video", - "display_name": "Seedance v1.0 Lite Image-to-Video", + "id": "NousResearch/Hermes-4-70B:thinking", + "name": "Hermes 4 (Thinking)", + "display_name": "Hermes 4 (Thinking)", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "release_date": "2025-09-17", + "last_updated": "2025-09-17", + "cost": { + "input": 0.2006, + "output": 0.3995 + }, "type": "chat" }, { - "id": "bytedance/seedream-5.0-lite", - "name": "Seedream 5.0 Lite", - "display_name": "Seedream 5.0 Lite", + "id": "NousResearch/hermes-4-70b", + "name": "Hermes 4 Medium", + "display_name": "Hermes 4 Medium", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "release_date": "2025-07-03", + "last_updated": "2025-07-03", + "cost": { + "input": 0.2006, + "output": 0.3995 + }, "type": "chat" }, { - "id": "bytedance/seedance-2.0", - "name": "Seedance 2.0", - "display_name": "Seedance 2.0", + "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes-3 Mistral 24B (Preview)", + "display_name": "DeepHermes-3 Mistral 24B (Preview)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "video" + "text" ] }, "limit": 
{ - "context": 8192, - "output": 8192 + "context": 128000, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-14", - "last_updated": "2026-04-14", + "release_date": "2025-05-10", + "last_updated": "2025-05-10", + "cost": { + "input": 0.3, + "output": 0.3 + }, "type": "chat" }, { - "id": "bytedance/seedream-4.0", - "name": "Seedream 4.0", - "display_name": "Seedream 4.0", + "id": "NousResearch/hermes-4-405b:thinking", + "name": "Hermes 4 Large (Thinking)", + "display_name": "Hermes 4 Large (Thinking)", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-28", - "last_updated": "2025-08-28", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", + "cost": { + "input": 0.3, + "output": 1.2 + }, "type": "chat" }, { - "id": "bytedance/seedream-4.5", - "name": "Seedream 4.5", - "display_name": "Seedream 4.5", + "id": "unsloth/gemma-3-12b-it", + "name": "Gemma 3 12B IT", + "display_name": "Gemma 3 12B IT", "modalities": { "input": [ + "text", + "pdf" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 128000, + "output": 131072 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", + "cost": { + "input": 0.272, + "output": 0.272 + }, + "type": "chat" + }, + { + "id": "unsloth/gemma-3-4b-it", + "name": "Gemma 3 4B IT", + "display_name": "Gemma 3 4B IT", + "modalities": { + "input": [ + "text", + "pdf" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 128000, "output": 8192 }, - "temperature": true, "tool_call": false, 
"reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-11-28", - "last_updated": "2025-11-28", + "release_date": "2025-03-10", + "last_updated": "2025-03-10", + "cost": { + "input": 0.2006, + "output": 0.2006 + }, "type": "chat" }, { - "id": "bytedance/seed-1.6", - "name": "Seed 1.6", - "display_name": "Seed 1.6", + "id": "unsloth/gemma-3-27b-it", + "name": "Gemma 3 27B IT", + "display_name": "Gemma 3 27B IT", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 96000 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", + "cost": { + "input": 0.2992, + "output": 0.2992 + }, + "type": "chat" + }, + { + "id": "NeverSleep/Lumimaid-v0.2-70B", + "name": "Lumimaid v0.2", + "display_name": "Lumimaid v0.2", "modalities": { "input": [ "text" @@ -165904,58 +170937,57 @@ ] }, "limit": { - "context": 256000, - "output": 32000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-01", - "last_updated": "2025-09", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 1, + "output": 1.5 }, "type": "chat" }, { - "id": "bytedance/seedance-v1.0-pro", - "name": "Seedance v1.0 Pro", - "display_name": "Seedance v1.0 Pro", + "id": "mistralai/mixtral-8x7b-instruct-v0.1", + "name": "Mixtral 8x7B", + "display_name": "Mixtral 8x7B", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 32768 }, - "temperature": 
true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-06-11", - "last_updated": "2025-06-11", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 0.27, + "output": 0.27 + }, "type": "chat" }, { - "id": "bytedance/seed-1.8", - "name": "Seed 1.8", - "display_name": "Seed 1.8", + "id": "mistralai/mistral-small-4-119b-2603:thinking", + "name": "Mistral Small 4 119B Thinking", + "display_name": "Mistral Small 4 119B Thinking", "modalities": { "input": [ "text", @@ -165966,359 +170998,393 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 16384 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-09-01", - "last_updated": "2025-10", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.05 + "input": 0.4, + "output": 1.4 }, "type": "chat" }, { - "id": "bytedance/seedance-v1.5-pro", - "name": "Seedance v1.5 Pro", - "display_name": "Seedance v1.5 Pro", + "id": "mistralai/mixtral-8x22b-instruct-v0.1", + "name": "Mixtral 8x22B", + "display_name": "Mixtral 8x22B", "modalities": { "input": [ "text" ], "output": [ - "video" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 65536, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", + "cost": { + "input": 0.8999999999999999, + "output": 0.8999999999999999 + }, "type": "chat" }, { - "id": "recraft/recraft-v4.1-utility", - "name": "Recraft V4.1 Utility", - "display_name": "Recraft V4.1 Utility", + "id": 
"mistralai/Devstral-Small-2505", + "name": "Mistral Devstral Small 2505", + "display_name": "Mistral Devstral Small 2505", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, + "context": 32768, "output": 8192 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-14", - "last_updated": "2026-05-14", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", + "cost": { + "input": 0.060000000000000005, + "output": 0.060000000000000005 + }, "type": "chat" }, { - "id": "recraft/recraft-v4.1-pro", - "name": "Recraft V4.1 Pro", - "display_name": "Recraft V4.1 Pro", + "id": "mistralai/ministral-8b-2512", + "name": "Ministral 8B", + "display_name": "Ministral 8B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-14", - "last_updated": "2026-05-14", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", + "cost": { + "input": 0.15, + "output": 0.15 + }, "type": "chat" }, { - "id": "recraft/recraft-v4-pro", - "name": "Recraft V4 Pro", - "display_name": "Recraft V4 Pro", + "id": "mistralai/mistral-saba", + "name": "Mistral Saba", + "display_name": "Mistral Saba", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32000, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-02-17", + "last_updated": "2025-02-17", + "cost": { + "input": 0.1989, + "output": 0.595 + }, "type": "chat" }, { - "id": 
"recraft/recraft-v4.1-utility-pro", - "name": "Recraft V4.1 Utility Pro", - "display_name": "Recraft V4.1 Utility Pro", + "id": "mistralai/mistral-large", + "name": "Mistral Large 2411", + "display_name": "Mistral Large 2411", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 256000 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-14", - "last_updated": "2026-05-14", + "release_date": "2024-02-26", + "last_updated": "2024-02-26", + "cost": { + "input": 2.006, + "output": 6.001 + }, "type": "chat" }, { - "id": "recraft/recraft-v2", - "name": "Recraft V2", - "display_name": "Recraft V2", + "id": "mistralai/mistral-medium-3.1", + "name": "Mistral Medium 3.1", + "display_name": "Mistral Medium 3.1", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-03-01", - "last_updated": "2024-03", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 0.4, + "output": 2 + }, "type": "chat" }, { - "id": "recraft/recraft-v3", - "name": "Recraft V3", - "display_name": "Recraft V3", + "id": "mistralai/ministral-3b-2512", + "name": "Ministral 3B", + "display_name": "Ministral 3B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 512, - "output": 8192 + "context": 131072, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2024-10-01", - "last_updated": "2024-10", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", + "cost": { + 
"input": 0.1, + "output": 0.1 + }, "type": "chat" }, { - "id": "recraft/recraft-v4", - "name": "Recraft V4", - "display_name": "Recraft V4", + "id": "mistralai/ministral-14b-instruct-2512", + "name": "Ministral 3 14B", + "display_name": "Ministral 3 14B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", + "cost": { + "input": 0.1, + "output": 0.4 + }, "type": "chat" }, { - "id": "recraft/recraft-v4.1", - "name": "Recraft V4.1", - "display_name": "Recraft V4.1", + "id": "mistralai/mistral-small-4-119b-2603", + "name": "Mistral Small 4 119B", + "display_name": "Mistral Small 4 119B", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 262144, + "output": 16384 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-16", + "last_updated": "2026-03-16", + "cost": { + "input": 0.4, + "output": 1.4 + }, + "type": "chat" + }, + { + "id": "mistralai/ministral-14b-2512", + "name": "Ministral 14B", + "display_name": "Ministral 14B", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-05-14", - "last_updated": "2026-05-14", + "release_date": "2025-12-04", + "last_updated": "2025-12-04", + "cost": { + "input": 0.2, + "output": 0.2 + }, "type": "chat" }, { - 
"id": "minimax/minimax-m3", - "name": "MiniMax M3", - "display_name": "MiniMax M3", + "id": "mistralai/mistral-large-3-675b-instruct-2512", + "name": "Mistral Large 3 675B", + "display_name": "Mistral Large 3 675B", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 1000000 + "context": 262144, + "output": 256000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-05-31", - "last_updated": "2026-06-01", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7-highspeed", - "name": "MiniMax M2.7 High Speed", - "display_name": "MiniMax M2.7 High Speed", + "id": "mistralai/mistral-medium-3", + "name": "Mistral Medium 3", + "display_name": "Mistral Medium 3", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131100 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": true, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.4, + "output": 2 }, "type": "chat" }, { - "id": 
"minimax/minimax-m2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "mistralai/devstral-2-123b-instruct-2512", + "name": "Devstral 2 123B", + "display_name": "Devstral 2 123B", "modalities": { "input": [ "text" @@ -166328,38 +171394,57 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "attachment": false, + "open_weights": false, + "release_date": "2025-12-09", + "last_updated": "2025-12-09", + "cost": { + "input": 0.4, + "output": 1.4 + }, + "type": "chat" + }, + { + "id": "mistralai/codestral-2508", + "name": "Codestral 2508", + "display_name": "Codestral 2508", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 256000, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-12-23", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "output": 0.8999999999999999 }, "type": "chat" }, { - "id": "minimax/minimax-m2.7", - "name": "Minimax M2.7", - "display_name": "Minimax M2.7", + "id": "mistralai/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo", + "display_name": "Mistral Nemo", "modalities": { "input": [ "text" @@ -166369,42 +171454,27 @@ ] }, "limit": { - "context": 204800, - "output": 131000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - 
"summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": false, + "release_date": "2024-07-18", + "last_updated": "2024-07-18", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0.1003, + "output": 0.1207 }, "type": "chat" }, { - "id": "minimax/minimax-m2", - "name": "MiniMax M2", - "display_name": "MiniMax M2", + "id": "bytedance-seed/seed-2.0-lite", + "name": "ByteDance Seed 2.0 Lite", + "display_name": "ByteDance Seed 2.0 Lite", "modalities": { "input": [ "text" @@ -166414,38 +171484,88 @@ ] }, "limit": { - "context": 205000, - "output": 205000 + "context": 262144, + "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true - } + "attachment": false, + "open_weights": false, + "release_date": "2026-03-10", + "last_updated": "2026-03-10", + "cost": { + "input": 0.25, + "output": 2 + }, + "type": "chat" + }, + { + "id": "anthracite-org/magnum-v2-72b", + "name": "Magnum V2 72B", + "display_name": "Magnum V2 72B", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "open_weights": false, + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 2.006, + "output": 2.992 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax 
M2.5", - "display_name": "MiniMax M2.5", + "id": "anthracite-org/magnum-v4-72b", + "name": "Magnum v4 72B", + "display_name": "Magnum v4 72B", + "modalities": { + "input": [ + "text", + "pdf" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-01-01", + "last_updated": "2025-01-01", + "cost": { + "input": 2.006, + "output": 2.992 + }, + "type": "chat" + }, + { + "id": "inflatebot/MN-12B-Mag-Mell-R1", + "name": "Mag Mell R1", + "display_name": "Mag Mell R1", "modalities": { "input": [ "text" @@ -166455,47 +171575,39 @@ ] }, "limit": { - "context": 204800, - "output": 131000 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5-highspeed", - "name": "MiniMax M2.5 High Speed", - "display_name": "MiniMax M2.5 High Speed", + "id": "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning", + "name": "Nvidia Nemotron 3 Nano Omni", + "display_name": "Nvidia Nemotron 3 Nano Omni", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131000 + "context": 256000, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -166503,27 +171615,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": 
false, + "attachment": true, "open_weights": false, - "release_date": "2026-02-12", - "last_updated": "2026-02-13", + "release_date": "2026-04-28", + "last_updated": "2026-04-28", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.105, + "output": 0.42 }, "type": "chat" }, { - "id": "minimax/minimax-m2.1-lightning", - "name": "MiniMax M2.1 Lightning", - "display_name": "MiniMax M2.1 Lightning", + "id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "name": "Nvidia Nemotron 70b", + "display_name": "Nvidia Nemotron 70b", "modalities": { "input": [ "text" @@ -166533,45 +171638,31 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 8192 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.3, - "output": 2.4, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.357, + "output": 0.408 }, "type": "chat" - } - ] - }, - "abacus": { - "id": "abacus", - "name": "Abacus", - "display_name": "Abacus", - "api": "https://routellm.abacus.ai/v1", - "doc": "https://abacus.ai/help/api", - "models": [ + }, { - "id": "route-llm", - "name": "Route LLM", - "display_name": "Route LLM", + "id": "nvidia/nvidia-nemotron-nano-9b-v2", + "name": "Nvidia Nemotron Nano 9B v2", + "display_name": "Nvidia Nemotron Nano 9B v2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -166582,527 +171673,342 @@ "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-01-01", - "last_updated": 
"2024-01-01", + "release_date": "2025-08-18", + "last_updated": "2025-08-18", "cost": { - "input": 3, - "output": 15 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "nvidia/Llama-3_3-Nemotron-Super-49B-v1_5", + "name": "Nvidia Nemotron Super 49B v1.5", + "display_name": "Nvidia Nemotron Super 49B v1.5", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 128000, + "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 3, - "output": 15 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "nvidia/nemotron-3-nano-30b-a3b", + "name": "Nvidia Nemotron 3 Nano 30B", + "display_name": "Nvidia Nemotron 3 Nano 30B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 262144 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-12-15", + "last_updated": "2025-12-15", "cost": { - "input": 0.25, - "output": 2 + "input": 0.17, + "output": 0.68 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "nvidia/Llama-3.3-Nemotron-Super-49B-v1", + "name": "Nvidia Nemotron Super 49B", + "display_name": "Nvidia Nemotron Super 49B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, 
+ "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2025-08-08", + "last_updated": "2025-08-08", "cost": { - "input": 1.75, - "output": 14 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "nvidia/nemotron-3-super-120b-a12b:thinking", + "name": "Nvidia Nemotron 3 Super 120B Thinking", + "display_name": "Nvidia Nemotron 3 Super 120B Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 1.25, - "output": 10 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": 
"nvidia/nemotron-3-super-120b-a12b", + "name": "Nvidia Nemotron 3 Super 120B", + "display_name": "Nvidia Nemotron 3 Super 120B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 2, - "output": 8 + "input": 0.05, + "output": 0.25 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat Latest", - "display_name": "GPT-5.3 Chat Latest", + "id": "cognitivecomputations/dolphin-2.9.2-qwen2-72b", + "name": "Dolphin 72b", + "display_name": "Dolphin 72b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.75, - "output": 14 + "input": 0.306, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-haiku-4-5-20251001", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "xiaomi/mimo-v2-flash-original", + "name": "MiMo V2 Flash Original", + "display_name": 
"MiMo V2 Flash Original", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 1, - "output": 5 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "xiaomi/mimo-v2-flash-thinking-original", + "name": "MiMo V2 Flash (Thinking) Original", + "display_name": "MiMo V2 Flash (Thinking) Original", "modalities": { "input": [ - "text", - "image", - "audio" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 2.5, - "output": 10 + "input": 0.102, + 
"output": 0.306 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "xiaomi/mimo-v2.5", + "name": "MiMo V2.5", + "display_name": "MiMo V2.5", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 1.25, - "output": 10 + "input": 0.14, + "output": 0.28, + "cache_read": 0.0028 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "xiaomi/mimo-v2-omni", + "name": "MiMo V2 Omni", + "display_name": "MiMo V2 Omni", "modalities": { "input": [ "text", "image", - "audio", "video", - "pdf" + "audio" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2026-03-01", - "last_updated": "2026-03-01", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "cache_write": 1 + "input": 0.4, + "output": 
2, + "cache_read": 0.08 }, "type": "chat" }, { - "id": "grok-4-0709", - "name": "Grok 4", - "display_name": "Grok 4", + "id": "xiaomi/mimo-v2-flash", + "name": "MiMo V2 Flash", + "display_name": "MiMo V2 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -167110,141 +172016,120 @@ }, "limit": { "context": 256000, - "output": 16384 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 3, - "output": 15 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "grok-4-fast-non-reasoning", - "name": "Grok 4 Fast (Non-Reasoning)", - "display_name": "Grok 4 Fast (Non-Reasoning)", + "id": "xiaomi/mimo-v2-pro", + "name": "MiMo V2 Pro", + "display_name": "MiMo V2 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 1048576, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-07-09", - "last_updated": "2025-07-09", + "release_date": "2026-03-19", + "last_updated": "2026-03-19", "cost": { - "input": 0.2, - "output": 0.5 + "input": 1, + "output": 3, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 Mini", - "display_name": "GPT-4.1 Mini", + "id": "xiaomi/mimo-v2.5-pro", + "name": "MiMo V2.5 Pro", + "display_name": "MiMo V2.5 Pro", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 1048576, + "output": 
131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.4, - "output": 1.6 + "input": 0.435, + "output": 0.87, + "cache_read": 0.0036 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "xiaomi/mimo-v2-flash-thinking", + "name": "MiMo V2 Flash (Thinking)", + "display_name": "MiMo V2 Flash (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 256000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 20, - "output": 40 + "input": 0.102, + "output": 0.306 }, "type": "chat" }, { - "id": "claude-opus-4-20250514", - "name": "Claude Opus 4", - "display_name": "Claude Opus 4", + "id": "anthropic/claude-haiku-latest", + "name": "Claude Haiku Latest", + "display_name": "Claude Haiku Latest", "modalities": { "input": [ "text", @@ -167257,63 +172142,42 @@ }, "limit": { "context": 200000, - "output": 32000 + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2026-03-29", + "last_updated": "2026-03-29", "cost": { - "input": 15, - "output": 75 + "input": 1, + "output": 5, + "cache_read": 0.1 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "anthropic/claude-opus-4.7:thinking", + "name": "Claude 4.7 Opus Thinking", + "display_name": "Claude 4.7 Opus Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -167324,99 +172188,117 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.1, - "output": 4.4 + "input": 4.998, + "output": 25.007, + "cache_read": 0.4998 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "anthropic/claude-opus-4.6:thinking:max", + "name": "Claude 4.6 Opus Thinking Max", + "display_name": "Claude 4.6 Opus Thinking Max", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1050000, + "context": 1000000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", "high", - "xhigh" + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 2.5, - "output": 15 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "anthropic/claude-opus-4.6:thinking:low", + "name": "Claude 4.6 Opus Thinking Low", + "display_name": "Claude 4.6 Opus Thinking Low", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 1000000, + "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -167426,37 +172308,48 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "effort", - "effort": "medium", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ "low", "medium", - "high" + "high", + "max" ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
+ ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.1, - "output": 4.4 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "anthropic/claude-sonnet-4.6:thinking", + "name": "Claude Sonnet 4.6 Thinking", + "display_name": "Claude Sonnet 4.6 Thinking", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -167464,10 +172357,9 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -167477,213 +172369,180 @@ "reasoning": { "supported": true, "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ "low", "medium", - "high" + "high", + "max" ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", - "cost": { - "input": 0.5, - "output": 3 - }, - "type": "chat" - }, - { - "id": "qwen-2.5-coder-32b", - "name": "Qwen 2.5 Coder 32B", - "display_name": "Qwen 2.5 Coder 32B", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 8192 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-11", - "last_updated": "2024-11-11", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 0.79, - "output": 0.79 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "qwen3-max", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "anthropic/claude-opus-4.7", + "name": "Claude 4.7 Opus", + "display_name": "Claude 4.7 Opus", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], "interleaved": true, "summaries": true, - "visibility": "summary", + "visibility": "omitted", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
] } }, - "attachment": false, - "open_weights": false, - "release_date": "2025-05-28", - "last_updated": "2025-05-28", - "cost": { - "input": 1.2, - "output": 6 - }, - "type": "chat" - }, - { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat Latest", - "display_name": "GPT-5.2 Chat Latest", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 400000, - "output": 128000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 1.75, - "output": 14 + "input": 4.998, + "output": 25.007, + "cache_read": 0.4998 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "anthropic/claude-opus-4.6:thinking:medium", + "name": "Claude 4.6 Opus Thinking Medium", + "display_name": "Claude 4.6 Opus Thinking Medium", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", + "default_enabled": true, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; 
budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 1.25, - "output": 10 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "anthropic/claude-opus-4.8:thinking", + "name": "Claude Opus 4.8 Thinking", + "display_name": "Claude Opus 4.8 Thinking", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -167694,84 +172553,90 @@ "supported": true, "default_enabled": true, "mode": "effort", - "effort": "medium", + "effort": "high", "effort_options": [ - "minimal", "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." 
+ ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.05, - "output": 0.4 + "input": 4.998, + "output": 25.007, + "cache_read": 0.4998 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o Mini", - "display_name": "GPT-4o Mini", + "id": "anthropic/claude-sonnet-latest", + "name": "Claude Sonnet Latest", + "display_name": "Claude Sonnet Latest", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "release_date": "2026-03-01", + "last_updated": "2026-03-01", "cost": { - "input": 0.15, - "output": 0.6 + "input": 2.992, + "output": 14.994, + "cache_read": 0.2992 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "anthropic/claude-opus-4.8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 1000000, "output": 128000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -167782,75 +172647,80 @@ "supported": true, "default_enabled": false, "mode": "effort", - "effort": "none", + "effort": "high", "effort_options": [ - "none", "low", "medium", - "high" + "high", + "xhigh", + "max" ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + 
"thinking_blocks" ], - "visibility": "hidden" + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 1.25, - "output": 10 + "input": 4.998, + "output": 25.007, + "cache_read": 0.4998 }, "type": "chat" }, { - "id": "grok-4-1-fast-non-reasoning", - "name": "Grok 4.1 Fast (Non-Reasoning)", - "display_name": "Grok 4.1 Fast (Non-Reasoning)", + "id": "anthropic/claude-opus-latest", + "name": "Claude Opus Latest", + "display_name": "Claude Opus Latest", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 2000000, - "output": 16384 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-11-17", - "last_updated": "2025-11-17", + "release_date": "2026-03-29", + "last_updated": "2026-03-29", "cost": { - "input": 0.2, - "output": 0.5 + "input": 4.998, + "output": 25.007, + "cache_read": 0.4998 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "anthropic/claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", "image", - "audio", - "video", "pdf" ], "output": [ @@ -167858,82 +172728,57 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 128000 }, - "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", + "default_enabled": false, + "mode": "mixed", "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, + "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-25", - "last_updated": "2025-03-25", - "cost": { - "input": 1.25, - "output": 10 - }, - "type": "chat" - }, - { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 1047576, - "output": 32768 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-02-17", "cost": { - "input": 2, - "output": 8 + "input": 2.992, + "output": 14.993999999999998 }, "type": "chat" }, { - "id": "claude-sonnet-4-5-20250929", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "anthropic/claude-opus-4.6:thinking", + "name": "Claude 4.6 Opus Thinking", + "display_name": "Claude 4.6 Opus Thinking", "modalities": { "input": [ "text", @@ -167945,24 +172790,30 @@ ] }, "limit": { - "context": 
200000, - "output": 64000 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", + "default_enabled": true, + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -167970,26 +172821,25 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 3, - "output": 15 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "claude-opus-4-1-20250805", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "anthropic/claude-opus-4.6", + "name": "Claude 4.6 Opus", + "display_name": "Claude 4.6 Opus", "modalities": { "input": [ "text", @@ -168001,10 +172851,9 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 1000000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -168014,11 +172863,18 @@ "reasoning": { "supported": true, "default_enabled": false, - "mode": "budget", + "mode": "mixed", "budget": { "min": 1024, "unit": "tokens" }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", @@ -168026,247 +172882,151 @@ "thinking_blocks" ], "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
] } }, "attachment": true, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 15, - "output": 75 + "input": 4.998, + "output": 25.007 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "tencent/Hunyuan-MT-7B", + "name": "Hunyuan MT 7B", + "display_name": "Hunyuan MT 7B", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-09-18", + "last_updated": "2025-09-18", "cost": { - "input": 2, - "output": 12 + "input": 10, + "output": 20 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "tencent/hy3-preview", + "name": "Tencent: Hy3 preview", + "display_name": "Tencent: Hy3 preview", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - 
"supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 1.75, - "output": 14 + "input": 0.066, + "output": 0.26, + "cache_read": 0.029 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506", + "name": "Mistral Small 3.2 24b Instruct", + "display_name": "Mistral Small 3.2 24b Instruct", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.3, - "output": 2.5 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "claude-3-7-sonnet-20250219", - "name": "Claude Sonnet 3.7", - "display_name": "Claude Sonnet 3.7", + "id": 
"dmind/dmind-1-mini", + "name": "DMind-1-Mini", + "display_name": "DMind-1-Mini", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": false, - "summaries": false, - "visibility": "full", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic uses thinking budget tokens" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-10-31", - "release_date": "2025-02-19", - "last_updated": "2025-02-19", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 0.4 }, "type": "chat" }, { - "id": "kimi-k2-turbo-preview", - "name": "Kimi K2 Turbo Preview", - "display_name": "Kimi K2 Turbo Preview", + "id": "dmind/dmind-1", + "name": "DMind-1", + "display_name": "DMind-1", "modalities": { "input": [ "text" @@ -168276,256 +173036,181 @@ ] }, "limit": { - "context": 256000, + "context": 32768, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-07-08", - "last_updated": "2025-07-08", + "release_date": "2025-06-01", + "last_updated": "2025-06-01", "cost": { - "input": 0.15, - "output": 8 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "claude-opus-4-5-20251101", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 4.5", + "id": "MarinaraSpaghetti/NemoMix-Unleashed-12B", + "name": "NemoMix 12B Unleashed", + "display_name": "NemoMix 12B 
Unleashed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-01", - "last_updated": "2025-11-01", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 5, - "output": 25 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "deepcogito/cogito-v1-preview-qwen-32B", + "name": "Cogito v1 Preview Qwen 32B", + "display_name": "Cogito v1 Preview Qwen 32B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - 
"low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": false, + "release_date": "2025-05-10", + "last_updated": "2025-05-10", + "cost": { + "input": 1.7999999999999998, + "output": 1.7999999999999998 }, - "attachment": true, + "type": "chat" + }, + { + "id": "cohere/command-r", + "name": "Cohere: Command R", + "display_name": "Cohere: Command R", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 4096 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2024-03-11", + "last_updated": "2024-03-11", "cost": { - "input": 1.75, - "output": 14 + "input": 0.476, + "output": 1.428 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "cohere/command-r-plus-08-2024", + "name": "Cohere: Command R+", + "display_name": "Cohere: Command R+", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 4096 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": 
"2024-08-30", + "last_updated": "2024-08-30", "cost": { - "input": 1.25, - "output": 10 + "input": 2.856, + "output": 14.246 }, "type": "chat" }, { - "id": "claude-sonnet-4-20250514", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "stepfun/step-3.7-flash:thinking", + "name": "Step 3.7 Flash Thinking", + "display_name": "Step 3.7 Flash Thinking", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 256000, + "output": 256000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2025-05-14", - "last_updated": "2025-05-14", + "release_date": "2026-05-29", + "last_updated": "2026-05-29", "cost": { - "input": 3, - "output": 15 + "input": 0.2, + "output": 1.15, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "llama-3.3-70b-versatile", - "name": "Llama 3.3 70B Versatile", - "display_name": "Llama 3.3 70B Versatile", + "id": "nex-agi/deepseek-v3.1-nex-n1", + "name": "DeepSeek V3.1 Nex N1", + "display_name": "DeepSeek V3.1 Nex N1", "modalities": { "input": [ "text" @@ -168536,31 +173221,29 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "release_date": "2025-12-10", + "last_updated": "2025-12-10", "cost": { - "input": 0.59, - "output": 0.79 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "undi95/remm-slerp-l2-13b", + "name": "ReMM SLERP 13B", + "display_name": "ReMM SLERP 13B", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -168568,107 +173251,100 @@ ] }, "limit": { - "context": 200000, - "output": 128000 + "context": 6144, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - 
"notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 5, - "output": 25 + "input": 0.7989999999999999, + "output": 1.2069999999999999 }, "type": "chat" }, { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat Latest", - "display_name": "GPT-5.1 Chat Latest", + "id": "nothingiisreal/L3.1-70B-Celeste-V0.1-BF16", + "name": "Llama 3.1 70B Celeste v0.1", + "display_name": "Llama 3.1 70B Celeste v0.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, + "context": 16384, + "output": 16384 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", + "cost": { + "input": 0.49299999999999994, + "output": 0.49299999999999994 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.7-flash-original:thinking", + "name": "GLM 4.7 Flash Original Thinking", + "display_name": "GLM 4.7 Flash Original Thinking", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 200000, "output": 128000 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.25, - "output": 10 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { 
- "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "zai-org/glm-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -168687,145 +173363,142 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0.6, - "output": 3 + "input": 0.15, + "output": 0.8 }, "type": "chat" }, { - "id": "gpt-5.3-codex-xhigh", - "name": "GPT-5.3 Codex XHigh", - "display_name": "GPT-5.3 Codex XHigh", + "id": "zai-org/GLM-4.5-Air:thinking", + "name": "GLM 4.5 Air (Thinking)", + "display_name": "GLM 4.5 Air (Thinking)", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 98304 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 1.75, - "output": 14 + "input": 0.12, + "output": 0.8 }, "type": "chat" }, { - "id": "grok-code-fast-1", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": 
"zai-org/GLM-4.5:thinking", + "name": "GLM 4.5 (Thinking)", + "display_name": "GLM 4.5 (Thinking)", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 128000, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", + "cost": { + "input": 0.3, + "output": 1.3 + }, + "type": "chat" + }, + { + "id": "zai-org/glm-4.5", + "name": "GLM 4.5", + "display_name": "GLM 4.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.2, - "output": 1.5 + "input": 0.3, + "output": 1.3 }, "type": "chat" }, { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 Nano", - "display_name": "GPT-4.1 Nano", + "id": "zai-org/glm-5-original", + "name": "GLM 5 Original", + "display_name": "GLM 5 Original", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.1, - "output": 0.4 + "input": 
1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek/deepseek-v3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ "text" @@ -168835,29 +173508,33 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.55, - "output": 1.66 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "zai-org/glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "zai-org/glm-4.7-original", + "name": "GLM 4.7 Original", + "display_name": "GLM 4.7 Original", "modalities": { "input": [ "text" @@ -168867,33 +173544,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0.6, - "output": 2.2 + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "zai-org/glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "zai-org/glm-4.7-original:thinking", + "name": "GLM 4.7 Original Thinking", + "display_name": "GLM 4.7 Original Thinking", "modalities": { "input": [ "text" @@ -168903,39 +173576,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 
200000, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { "input": 0.6, - "output": 2.2 + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "zai-org/glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "zai-org/glm-4.7-flash-original", + "name": "GLM 4.7 Flash Original", + "display_name": "GLM 4.7 Flash Original", "modalities": { "input": [ "text" @@ -168945,40 +173608,28 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1, - "output": 3.2 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "zai-org/glm-4.5", - "name": "GLM-4.5", - "display_name": "GLM-4.5", + "id": "zai-org/glm-4.7:thinking", + "name": "GLM 4.7 Thinking", + "display_name": "GLM 4.7 Thinking", "modalities": { "input": [ "text" @@ -168988,62 +173639,59 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 65535 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, 
"attachment": false, - "open_weights": true, - "release_date": "2025-07-28", - "last_updated": "2025-07-28", + "open_weights": false, + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.6, - "output": 2.2 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", - "name": "Llama 4 Maverick 17B 128E Instruct FP8", - "display_name": "Llama 4 Maverick 17B 128E Instruct FP8", + "id": "zai-org/glm-5.1:thinking", + "name": "GLM 5.1 Thinking", + "display_name": "GLM 5.1 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 32768 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.14, - "output": 0.59 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Llama 3.1 8B Instruct", - "display_name": "Llama 3.1 8B Instruct", + "id": "zai-org/glm-5:thinking", + "name": "GLM 5 Thinking", + "display_name": "GLM 5 Thinking", "modalities": { "input": [ "text" @@ -169053,31 +173701,32 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.02, - "output": 0.05 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": 
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo", - "name": "Llama 3.1 405B Instruct Turbo", - "display_name": "Llama 3.1 405B Instruct Turbo", + "id": "zai-org/glm-4.6v", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -169085,27 +173734,26 @@ }, "limit": { "context": 128000, - "output": 4096 + "output": 24000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2024-07-23", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 3.5, - "output": 3.5 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1-Terminus", - "name": "DeepSeek V3.1 Terminus", - "display_name": "DeepSeek V3.1 Terminus", + "id": "zai-org/glm-4.6-original", + "name": "GLM 4.6 Original", + "display_name": "GLM 4.6 Original", "modalities": { "input": [ "text" @@ -169115,29 +173763,28 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-01", - "last_updated": "2025-06-01", + "open_weights": false, + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.27, - "output": 1 + "input": 0.35, + "output": 1.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "zai-org/glm-5-original:thinking", + "name": "GLM 5 Original Thinking", + "display_name": "GLM 5 Original Thinking", "modalities": { "input": [ "text" @@ -169147,34 +173794,29 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 
128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-06-15", - "last_updated": "2025-06-15", + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.27, - "output": 0.4 + "input": 1, + "output": 3.2, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "zai-org/glm-4.7-flash:thinking", + "name": "GLM 4.7 Flash Thinking", + "display_name": "GLM 4.7 Flash Thinking", "modalities": { "input": [ "text" @@ -169184,86 +173826,64 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 3, - "output": 7 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/QwQ-32B", - "name": "QwQ 32B", - "display_name": "QwQ 32B", + "id": "zai-org/glm-4.6v-flash-original", + "name": "GLM 4.6V Flash", + "display_name": "GLM 4.6V Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 24000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { 
- "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-11-28", - "last_updated": "2024-11-28", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.4, + "input": 0.1, "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen 2.5 72B Instruct", - "display_name": "Qwen 2.5 72B Instruct", + "id": "zai-org/glm-4.6v-original", + "name": "GLM 4.6V Original", + "display_name": "GLM 4.6V Original", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -169271,27 +173891,26 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 24000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, - "open_weights": true, - "release_date": "2024-09-19", - "last_updated": "2024-09-19", + "attachment": true, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.11, - "output": 0.38 + "input": 0.6, + "output": 0.9 }, "type": "chat" }, { - "id": "Qwen/qwen3-coder-480b-a35b-instruct", - "name": "Qwen3 Coder 480B A35B Instruct", - "display_name": "Qwen3 Coder 480B A35B Instruct", + "id": "zai-org/glm-latest", + "name": "GLM Latest", + "display_name": "GLM Latest", "modalities": { "input": [ "text" @@ -169301,29 +173920,29 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 200000, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-22", - "last_updated": "2025-07-22", + "open_weights": false, + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": { - "input": 0.29, - 
"output": 1.2 + "input": 0.75, + "output": 2.6, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct", - "display_name": "Qwen3 235B A22B Instruct", + "id": "zai-org/glm-4.7-flash", + "name": "GLM 4.7 Flash", + "display_name": "GLM 4.7 Flash", "modalities": { "input": [ "text" @@ -169333,29 +173952,33 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2025-07-01", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 0.13, - "output": 0.6 + "input": 0.07, + "output": 0.4 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", - "name": "Qwen3 32B", - "display_name": "Qwen3 32B", + "id": "zai-org/GLM-4.6-turbo:thinking", + "name": "GLM 4.6 Turbo (Thinking)", + "display_name": "GLM 4.6 Turbo (Thinking)", "modalities": { "input": [ "text" @@ -169365,44 +173988,31 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 204800 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2025-04-29", + "open_weights": false, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.09, - "output": 0.29 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "zai-org/GLM-4.5-Air", 
+ "name": "GLM 4.5 Air", + "display_name": "GLM 4.5 Air", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -169410,42 +174020,26 @@ }, "limit": { "context": 128000, - "output": 32768 + "output": 98304 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": false, + "open_weights": false, + "release_date": "2025-04-15", + "last_updated": "2025-04-15", "cost": { - "input": 0.08, - "output": 0.44 + "input": 0.12, + "output": 0.8 }, "type": "chat" - } - ] - }, - "drun": { - "id": "drun", - "name": "D.Run (China)", - "display_name": "D.Run (China)", - "api": "https://chat.d.run/v1", - "doc": "https://www.d.run", - "models": [ + }, { - "id": "public/deepseek-r1", - "name": "DeepSeek R1", - "display_name": "DeepSeek R1", + "id": "zai-org/GLM-4.6-turbo", + "name": "GLM 4.6 Turbo", + "display_name": "GLM 4.6 Turbo", "modalities": { "input": [ "text" @@ -169455,41 +174049,27 @@ ] }, "limit": { - "context": 131072, - "output": 32000 + "context": 200000, + "output": 204800 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2025-01-20", + "open_weights": false, + "release_date": "2025-10-02", + "last_updated": "2025-10-02", "cost": { - "input": 0.55, - "output": 2.2 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "public/minimax-m25", - "name": "MiniMax M2.5", - "display_name": 
"MiniMax M2.5", + "id": "zai-org/glm-5", + "name": "GLM 5", + "display_name": "GLM 5", "modalities": { "input": [ "text" @@ -169499,10 +174079,9 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 128000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -169520,19 +174099,19 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-03-01", - "last_updated": "2025-03-01", + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.29, - "output": 1.16 + "input": 0.3, + "output": 2.55 }, "type": "chat" }, { - "id": "public/deepseek-v3", - "name": "DeepSeek V3", - "display_name": "DeepSeek V3", + "id": "Infermatic/MN-12B-Inferor-v0.0", + "name": "Mistral Nemo Inferor 12B", + "display_name": "Mistral Nemo Inferor 12B", "modalities": { "input": [ "text" @@ -169542,269 +174121,221 @@ ] }, "limit": { - "context": 131072, + "context": 16384, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2024-12-26", - "last_updated": "2024-12-26", + "open_weights": false, + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.28, - "output": 1.1 + "input": 0.25499999999999995, + "output": 0.49299999999999994 }, "type": "chat" - } - ] - }, - "google": { - "id": "google", - "name": "google", - "display_name": "google", - "doc": "https://ai.google.dev/gemini-api/docs/models", - "models": [ + }, { - "id": "gemini-2.5-flash-preview-tts", - "name": "Gemini 2.5 Flash Preview TTS", - "display_name": "Gemini 2.5 Flash Preview TTS", + "id": "shisa-ai/shisa-v2.1-llama3.3-70b", + "name": "Shisa V2.1 Llama 3.3 70B", + "display_name": "Shisa V2.1 Llama 3.3 70B", "modalities": { "input": [ "text" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, - 
"output": 16384 + "context": 32768, + "output": 4096 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { "input": 0.5, - "output": 10 + "output": 0.5 }, "type": "chat" }, { - "id": "gemini-2.5-flash-image", - "name": "Gemini 2.5 Flash Image", - "display_name": "Gemini 2.5 Flash Image", + "id": "shisa-ai/shisa-v2-llama3.3-70b", + "name": "Shisa V2 Llama 3.3 70B", + "display_name": "Shisa V2 Llama 3.3 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 128000, + "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-06", - "release_date": "2025-08-26", - "last_updated": "2025-08-26", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 0.3, - "output": 30, - "cache_read": 0.075 + "input": 0.5, + "output": 0.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-3.1-flash-lite-preview", - "name": "Gemini 3.1 Flash Lite Preview", - "display_name": "Gemini 3.1 Flash Lite Preview", + "id": "abacusai/Dracarys-72B-Instruct", + "name": "Llama 3.1 70B Dracarys 2", + "display_name": "Llama 3.1 70B Dracarys 2", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, 
"open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "release_date": "2025-08-02", + "last_updated": "2025-08-02", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "gemini-2.0-flash-lite", - "name": "Gemini 2.0 Flash Lite", - "display_name": "Gemini 2.0 Flash Lite", + "id": "deepseek-ai/DeepSeek-V3.1:thinking", + "name": "DeepSeek V3.1 Thinking", + "display_name": "DeepSeek V3.1 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 8192 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "search": { - "supported": false - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.075, - "output": 0.3 + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "gemma-4-31b-it", - "name": "Gemma 4 31B IT", - "display_name": "Gemma 4 31B IT", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-08-02", + "last_updated": "2025-08-02", + "cost": { + "input": 0.25, + "output": 0.7 }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": 
"2026-04-02", "type": "chat" }, { - "id": "gemini-flash-lite-latest", - "name": "Gemini Flash-Lite Latest", - "display_name": "Gemini Flash-Lite Latest", + "id": "deepseek-ai/deepseek-v3.2-exp-thinking", + "name": "DeepSeek V3.2 Exp Thinking", + "display_name": "DeepSeek V3.2 Exp Thinking", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 163840, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "gemini-3-flash-preview", - "name": "Gemini 3 Flash Preview", - "display_name": "Gemini 3 Flash Preview", + "id": "deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 0528", + "display_name": "DeepSeek R1 0528", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 128000, + "output": 163840 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -169812,45 +174343,31 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", 
- "last_updated": "2025-12-17", + "release_date": "2025-05-28", + "last_updated": "2025-05-28", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "input_audio": 1 + "input": 0.4, + "output": 1.7 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview-customtools", - "name": "Gemini 3.1 Pro Preview Custom Tools", - "display_name": "Gemini 3.1 Pro Preview Custom Tools", + "id": "deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ "text", - "image", - "video", - "audio", "pdf" ], "output": [ @@ -169858,570 +174375,343 @@ ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2025-07-26", + "last_updated": "2025-07-26", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.2, + "output": 0.7 }, "type": "chat" }, { - "id": "gemini-flash-latest", - "name": "Gemini Flash Latest", - "display_name": "Gemini Flash Latest", + "id": "deepseek-ai/deepseek-v3.2-exp", + "name": "DeepSeek V3.2 Exp", + "display_name": "DeepSeek V3.2 Exp", "modalities": { "input": [ - "text", - "image", - "audio", - "video", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + 
"context": 163840, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-09-25", - "last_updated": "2025-09-25", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.075, - "input_audio": 1 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "gemini-2.5-pro", - "name": "Gemini 2.5 Pro", - "display_name": "Gemini 2.5 Pro", + "id": "deepseek-ai/DeepSeek-V3.1-Terminus:thinking", + "name": "DeepSeek V3.1 Terminus (Thinking)", + "display_name": "DeepSeek V3.1 Terminus (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 128000, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 128, - "max": 32768 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-09-22", + "last_updated": "2025-09-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125, - "tiers": [ - { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 2.5, 
- "output": 15, - "cache_read": 0.25 - } + "input": 0.25, + "output": 0.7 }, "type": "chat" }, { - "id": "gemini-3.1-pro-preview", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "arcee-ai/trinity-large-thinking", + "name": "Trinity Large Thinking", + "display_name": "Trinity Large Thinking", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 80000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.25, + "output": 0.9 }, "type": "chat" }, { - "id": "gemini-3.1-flash-lite", - "name": "Gemini 3.1 Flash Lite", - "display_name": "Gemini 3.1 Flash Lite", + "id": "arcee-ai/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-07", - "last_updated": "2026-05-07", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0.25, - "output": 1.5, - "cache_read": 0.025, - "input_audio": 0.5 + "input": 0.045000000000000005, + "output": 0.15 }, "type": "chat" }, { - "id": "gemini-2.5-flash-lite", - "name": "Gemini 2.5 Flash Lite", - "display_name": "Gemini 2.5 Flash Lite", + "id": "soob3123/GrayLine-Qwen3-8B", + "name": "Grayline Qwen3 8B", + "display_name": "Grayline Qwen3 8B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-06-17", - "last_updated": "2025-06-17", + "release_date": "2025-09-25", + "last_updated": "2025-09-25", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.01, - "input_audio": 0.3 + "input": 0.3, + "output": 0.3 }, "type": "chat" }, { - "id": "gemini-2.5-flash", - "name": "Gemini 2.5 Flash", - "display_name": "Gemini 2.5 Flash", + "id": "soob3123/Veiled-Calla-12B", + "name": "Veiled Calla 12B", + "display_name": 
"Veiled Calla 12B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-03-20", - "last_updated": "2025-06-05", + "release_date": "2025-04-13", + "last_updated": "2025-04-13", "cost": { "input": 0.3, - "output": 2.5, - "cache_read": 0.03, - "input_audio": 1 + "output": 0.3 }, "type": "chat" }, { - "id": "gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "soob3123/amoral-gemma3-27B-v2", + "name": "Amoral Gemma3 27B v2", + "display_name": "Amoral Gemma3 27B v2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 32768, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2025-05-23", + "last_updated": "2025-05-23", + "cost": { + "input": 0.3, + "output": 0.3 }, - "attachment": true, - "open_weights": true, - "release_date": "2026-04-02", - "last_updated": "2026-04-02", "type": "chat" }, { - "id": "gemini-2.0-flash", - "name": "Gemini 
2.0 Flash", - "display_name": "Gemini 2.0 Flash", + "id": "meganova-ai/manta-mini-1.0", + "name": "Manta Mini 1.0", + "display_name": "Manta Mini 1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 8192, "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "search": { - "supported": true, - "default": false + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-06", - "release_date": "2024-12-11", - "last_updated": "2024-12-11", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0.02, + "output": 0.16 }, "type": "chat" }, { - "id": "gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "meganova-ai/manta-flash-1.0", + "name": "Manta Flash 1.0", + "display_name": "Manta Flash 1.0", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2025-12-20", + "last_updated": "2025-12-20", + "cost": { + "input": 0.02, + "output": 0.16 }, - "attachment": true, + "type": "chat" + }, + { + "id": "meganova-ai/manta-pro-1.0", + "name": "Manta Pro 1.0", + "display_name": "Manta 
Pro 1.0", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 32768, + "output": 32768 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "release_date": "2025-12-20", + "last_updated": "2025-12-20", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0.060000000000000005, + "output": 0.5 }, "type": "chat" }, { - "id": "gemini-3-pro-preview", - "name": "Gemini 3 Pro Preview", - "display_name": "Gemini 3 Pro Preview", + "id": "qwen/Qwen3.6-35B-A3B:thinking", + "name": "Qwen3.6 35B A3B Thinking", + "display_name": "Qwen3.6 35B A3B Thinking", "modalities": { "input": [ "text", "image", - "video", - "audio", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 262144, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -170429,52 +174719,28 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-04-19", + "last_updated": "2026-04-19", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 0.112, + "output": 0.8 }, "type": "chat" }, { - "id": 
"gemini-embedding-001", - "name": "Gemini Embedding 001", - "display_name": "Gemini Embedding 001", + "id": "qwen/qwen3-coder-plus", + "name": "Qwen3 Coder Plus", + "display_name": "Qwen3 Coder Plus", "modalities": { "input": [ "text" @@ -170484,347 +174750,258 @@ ] }, "limit": { - "context": 2048, - "output": 1 + "context": 128000, + "output": 65536 }, - "temperature": false, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-05", - "release_date": "2025-05-20", - "last_updated": "2025-05-20", + "release_date": "2025-09-17", + "last_updated": "2025-09-17", "cost": { - "input": 0.15, - "output": 0 + "input": 1, + "output": 5 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-2.5-pro-preview-tts", - "name": "Gemini 2.5 Pro Preview TTS", - "display_name": "Gemini 2.5 Pro Preview TTS", + "id": "qwen/Qwen3.6-35B-A3B", + "name": "Qwen3.6 35B A3B", + "display_name": "Qwen3.6 35B A3B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "audio" + "text" ] }, "limit": { - "context": 8192, + "context": 262144, "output": 16384 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": false, + "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-05-01", - "last_updated": "2025-05-01", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 1, - "output": 20 + "input": 0.112, + "output": 0.8 }, "type": "chat" }, { - "id": "gemini-3-pro-image-preview", - "name": "Nano Banana Pro", - 
"display_name": "Nano Banana Pro", + "id": "qwen/qwen3-32b", + "name": "Qwen 3 32b", + "display_name": "Qwen 3 32b", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 131072, + "context": 41000, "output": 32768 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-20", - "last_updated": "2025-11-20", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 2, - "output": 120 + "input": 0.1, + "output": 0.3 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "gemini-3.1-flash-image-preview", - "name": "Nano Banana 2", - "display_name": "Nano Banana 2", + "id": "qwen/Qwen3-VL-235B-A22B-Instruct", + "name": "Qwen3 VL 235B A22B Instruct", + "display_name": "Qwen3 VL 235B A22B Instruct", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 128000, + "output": 262144 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-02-26", - "last_updated": "2026-02-26", + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.5, - "output": 60 + "input": 0.3, + "output": 1.2 }, - "type": "imageGeneration" + "type": "chat" }, { - 
"id": "gemini-2.5-flash-preview-09-2025", - "name": "Gemini 2.5 Flash Preview 09 2025", - "display_name": "Gemini 2.5 Flash Preview 09 2025", + "id": "qwen/qwen3-max", + "name": "Qwen3 Max", + "display_name": "Qwen3 Max", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true, - "budget": { - "default": -1, - "min": 0, - "max": 24576 - } + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 0, - "max": 24576, - "auto": -1, - "off": 0, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { - "supported": true, - "default": false + "attachment": false, + "open_weights": false, + "release_date": "2025-09-05", + "last_updated": "2025-09-05", + "cost": { + "input": 1.08018, + "output": 5.4009 }, - "attachment": true, "type": "chat" }, { - "id": "gemini-2.5-flash-image-preview", - "name": "Gemini 2.5 Flash Image Preview", - "display_name": "Gemini 2.5 Flash Image Preview", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 32768, - "output": 32768 - }, - "temperature": true, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": false, - "type": "imageGeneration" - }, - { - "id": "gemini-2.5-flash-lite-preview-09-2025", - "name": "Gemini 2.5 Flash Lite Preview 09 2025", - "display_name": "Gemini 2.5 Flash Lite Preview 09 2025", + "id": "qwen/qwen3.5-397b-a17b-thinking", + "name": "Qwen3.5 397B A17B Thinking", + "display_name": "Qwen3.5 397B A17B Thinking", "modalities": { "input": [ "text", - "image" + 
"image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 258048, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false, - "budget": { - "default": -1, - "min": 512, - "max": 24576 - } + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "default": -1, - "min": 512, - "max": 24576, - "auto": -1, - "unit": "tokens" - }, + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "search": { - "supported": true, - "default": false - }, "attachment": true, + "open_weights": false, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", + "cost": { + "input": 0.6, + "output": 3.6 + }, "type": "chat" }, { - "id": "gemini-2.0-flash-preview-image-generation", - "name": "Gemini 2.0 Flash Preview Image Generation", - "display_name": "Gemini 2.0 Flash Preview Image Generation", + "id": "qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B (Instruct)", + "display_name": "Qwen3 Next 80B A3B (Instruct)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 32000, - "output": 8192 + "context": 256000, + "output": 262144 }, - "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, - "search": { - "supported": false + "attachment": false, + "open_weights": false, + "release_date": "2025-09-11", + "last_updated": "2025-09-11", + "cost": { + "input": 0.15, + "output": 0.65 }, - "attachment": true, "type": "chat" - } - ] - }, - "wandb": { - "id": "wandb", - "name": "Weights & Biases", - "display_name": "Weights & Biases", - "api": "https://api.inference.wandb.ai/v1", - "doc": "https://docs.wandb.ai/guides/integrations/inference/", - "models": [ + }, { - "id": 
"MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen 3 235b A22B 2507 (TEE)", + "display_name": "Qwen 3 235b A22B 2507 (TEE)", "modalities": { "input": [ "text" @@ -170834,33 +175011,27 @@ ] }, "limit": { - "context": 196608, - "output": 196608 + "context": 256000, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.13, + "output": 0.5 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "qwen/qwq-32b-preview", + "name": "Qwen QwQ 32B Preview", + "display_name": "Qwen QwQ 32B Preview", "modalities": { "input": [ "text" @@ -170870,14 +175041,12 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 32768, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -170891,21 +175060,19 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { - "input": 1.4, - "output": 4.4, - "cache_read": 0.26, - "cache_write": 0 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "zai-org/GLM-5-FP8", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "qwen/qwen3-next-80b-a3b-thinking", + "name": "Qwen3 Next 80B A3B (Thinking)", + "display_name": "Qwen3 Next 80B A3B (Thinking)", "modalities": { "input": [ "text" 
@@ -170915,28 +175082,38 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 256000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 1, - "output": 3.2 + "input": 0.15, + "output": 0.65 }, "type": "chat" }, { - "id": "OpenPipe/Qwen3-14B-Instruct", - "name": "OpenPipe Qwen3 14B Instruct", - "display_name": "OpenPipe Qwen3 14B Instruct", + "id": "qwen/qwen3-coder", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -170946,46 +175123,42 @@ ] }, "limit": { - "context": 32768, - "output": 32768 + "context": 262000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-04-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.05, - "output": 0.22 + "input": 0.13, + "output": 0.5 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen 3 235b A22B 2507 Thinking", + "display_name": "Qwen 3 235b A22B 2507 Thinking", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 256000, "output": 262144 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true 
+ "supported": true }, "extra_capabilities": { "reasoning": { @@ -170998,151 +175171,181 @@ ] } }, - "attachment": true, - "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-03-12", + "attachment": false, + "open_weights": false, + "release_date": "2025-09-11", + "last_updated": "2025-09-11", "cost": { - "input": 0.5, - "output": 2.85 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-70B-Instruct", - "name": "Llama 3.1 70B", - "display_name": "Llama 3.1 70B", + "id": "qwen/qwen3.5-plus", + "name": "Qwen3.5 Plus", + "display_name": "Qwen3.5 Plus", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 983616, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": false, - "open_weights": true, - "release_date": "2024-07-23", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "qwen/qwen3.5-plus-thinking", + "name": "Qwen3.5 Plus Thinking", + "display_name": "Qwen3.5 Plus Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 983616, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, 
"default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-07-23", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.22, - "output": 0.22 + "input": 0.4, + "output": 2.4, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "qwen/qwen3-235b-a22b", + "name": "Qwen 3 235b A22B", + "display_name": "Qwen 3 235b A22B", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 41000, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2025-04-29", + "last_updated": "2025-04-29", "cost": { - "input": 0.71, - "output": 0.71 + "input": 0.3, + "output": 0.5 }, "type": "chat" }, { - "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct", - "name": "Llama 4 Scout 17B 16E Instruct", - "display_name": "Llama 4 Scout 17B 16E Instruct", + "id": "qwen/qwen-2.5-72b-instruct", + "name": "Qwen2.5 72B", + "display_name": "Qwen2.5 72B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 64000, - "output": 
64000 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-31", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 0.17, - "output": 0.66 + "input": 0.357, + "output": 0.408 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "qwen/qwen3-coder-next", + "name": "Qwen3 Coder Next", + "display_name": "Qwen3 Coder Next", "modalities": { "input": [ "text" @@ -171152,92 +175355,113 @@ ] }, "limit": { - "context": 161000, - "output": 161000 + "context": 262144, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.55, - "output": 1.65 + "input": 0.15, + "output": 1.5 }, "type": "chat" }, { - "id": "nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-FP8", - "name": "NVIDIA Nemotron 3 Super 120B", - "display_name": "NVIDIA Nemotron 3 Super 120B", + "id": "qwen/qwen3.5-9b", + "name": "Qwen3.5 9B", + "display_name": "Qwen3.5 9B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": 
true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-03-10", + "last_updated": "2026-03-10", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.05, + "output": 0.15 }, "type": "chat" }, { - "id": "microsoft/Phi-4-mini-instruct", - "name": "Phi-4-mini-instruct", - "display_name": "Phi-4-mini-instruct", + "id": "qwen/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B", + "display_name": "Qwen3.5 397B A17B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 258048, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2023-10", - "release_date": "2024-12-11", - "last_updated": "2026-03-12", + "release_date": "2026-02-16", + "last_updated": "2026-02-16", "cost": { - "input": 0.08, - "output": 0.35 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct", - "name": "Qwen3-Coder-480B-A35B-Instruct", - "display_name": "Qwen3-Coder-480B-A35B-Instruct", + "id": "qwen/qwen3-coder-flash", + "name": "Qwen3 Coder Flash", + "display_name": "Qwen3 Coder Flash", "modalities": { "input": [ "text" @@ -171247,29 +175471,27 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 128000, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2026-03-12", + 
"open_weights": false, + "release_date": "2025-09-17", + "last_updated": "2025-09-17", "cost": { - "input": 1, + "input": 0.3, "output": 1.5 }, "type": "chat" }, { - "id": "Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3 30B A3B Instruct 2507", - "display_name": "Qwen3 30B A3B Instruct 2507", + "id": "qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen 2.5 Coder 32b", + "display_name": "Qwen 2.5 Coder 32b", "modalities": { "input": [ "text" @@ -171279,28 +175501,27 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-29", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", + "id": "qwen/Qwen3-8B", + "name": "Qwen 3 8B", + "display_name": "Qwen 3 8B", "modalities": { "input": [ "text" @@ -171310,14 +175531,12 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 41000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -171331,20 +175550,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-25", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.47, + "output": 0.47 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": 
"Qwen3 235B A22B Instruct 2507", + "id": "qwen/qwen3-14b", + "name": "Qwen 3 14b", + "display_name": "Qwen 3 14b", "modalities": { "input": [ "text" @@ -171354,29 +175572,38 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 41000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04-28", - "last_updated": "2026-03-12", + "open_weights": false, + "release_date": "2024-01-01", + "last_updated": "2024-01-01", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.08, + "output": 0.24 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen 3 235b A22B 2507", + "display_name": "Qwen 3 235b A22B 2507", "modalities": { "input": [ "text" @@ -171386,33 +175613,27 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 256000, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.15, - "output": 0.6 + "input": 0.13, + "output": 0.5 }, "type": "chat" }, { - "id": "openai/gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", + "id": "qwen/qwen3-30b-a3b", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -171422,65 +175643,28 @@ ] }, "limit": { - 
"context": 131072, - "output": 131072 + "context": 41000, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": false, - "release_date": "2025-08-05", - "last_updated": "2026-03-12", - "cost": { - "input": 0.05, - "output": 0.2 - }, - "type": "chat" - } - ] - }, - "meganova": { - "id": "meganova", - "name": "Meganova", - "display_name": "Meganova", - "api": "https://api.meganova.ai/v1", - "doc": "https://docs.meganova.ai", - "models": [ - { - "id": "XiaomiMiMo/MiMo-V2-Flash", - "name": "MiMo V2 Flash", - "display_name": "MiMo V2 Flash", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 32000 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "attachment": false, - "open_weights": true, - "knowledge": "2024-12-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2025-02-27", + "last_updated": "2025-02-27", "cost": { "input": 0.1, "output": 0.3 @@ -171488,9 +175672,9 @@ "type": "chat" }, { - "id": "mistralai/Mistral-Nemo-Instruct-2407", - "name": "Mistral Nemo Instruct 2407", - "display_name": "Mistral Nemo Instruct 2407", + "id": "amazon/nova-lite-v1", + "name": "Amazon Nova Lite 1.0", + "display_name": "Amazon Nova Lite 1.0", "modalities": { "input": [ "text" @@ -171500,61 +175684,57 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 300000, + "output": 5120 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + 
"open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.02, - "output": 0.04 + "input": 0.0595, + "output": 0.238 }, "type": "chat" }, { - "id": "mistralai/Mistral-Small-3.2-24B-Instruct-2506", - "name": "Mistral Small 3.2 24B Instruct", - "display_name": "Mistral Small 3.2 24B Instruct", + "id": "amazon/nova-pro-v1", + "name": "Amazon Nova Pro 1.0", + "display_name": "Amazon Nova Pro 1.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 8192 + "context": 300000, + "output": 32000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-06-20", - "last_updated": "2025-06-20", + "attachment": false, + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0, - "output": 0 + "input": 0.7989999999999999, + "output": 3.1959999999999997 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "amazon/nova-micro-v1", + "name": "Amazon Nova Micro 1.0", + "display_name": "Amazon Nova Micro 1.0", "modalities": { "input": [ "text" @@ -171564,40 +175744,27 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 5120 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - 
"input": 0.3, - "output": 1.2 + "input": 0.0357, + "output": 0.1394 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.1", - "name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "amazon/nova-2-lite-v1", + "name": "Amazon Nova 2 Lite", + "display_name": "Amazon Nova 2 Lite", "modalities": { "input": [ "text" @@ -171607,57 +175774,44 @@ ] }, "limit": { - "context": 196608, - "output": 131072 + "context": 1000000, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2024-12-03", + "last_updated": "2024-12-03", "cost": { - "input": 0.28, - "output": 1.2 + "input": 0.5099999999999999, + "output": 4.25 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "alibaba/qwen3.6-flash", + "name": "Qwen3.6 Flash", + "display_name": "Qwen3.6 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 991800, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -171671,37 +175825,36 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.19, + "output": 1.16 }, "type": "chat" }, { - "id": 
"zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "alibaba/qwen3.6-27b", + "name": "Qwen3.6 27B", + "display_name": "Qwen3.6 27B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 260096, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -171714,34 +175867,35 @@ ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.8, - "output": 2.56 + "input": 0.203, + "output": 2.24 }, "type": "chat" }, { - "id": "zai-org/GLM-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "alibaba/qwen3.6-27b:thinking", + "name": "Qwen3.6 27B Thinking", + "display_name": "Qwen3.6 27B Thinking", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 260096, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true @@ -171757,66 +175911,50 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "attachment": true, + "open_weights": false, + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 0.45, - "output": 1.9 + "input": 0.203, + "output": 2.24 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "aion-labs/aion-rp-llama-3.1-8b", + "name": "Llama 3.1 8b (uncensored)", + "display_name": "Llama 3.1 8b (uncensored)", "modalities": { "input": [ 
- "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 32768, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0.45, - "output": 2.8 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2-Thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "aion-labs/aion-2.5", + "name": "AionLabs: Aion-2.5", + "display_name": "AionLabs: Aion-2.5", "modalities": { "input": [ "text" @@ -171826,41 +175964,28 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2025-11-06", + "open_weights": false, + "release_date": "2026-03-20", + "last_updated": "2026-03-20", "cost": { - "input": 0.6, - "output": 2.6 + "input": 1, + "output": 3, + "cache_read": 0.35 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama 3.3 70B Instruct", - "display_name": "Llama 3.3 70B Instruct", + "id": 
"aion-labs/aion-1.0-mini", + "name": "Aion 1.0 mini (DeepSeek)", + "display_name": "Aion 1.0 mini (DeepSeek)", "modalities": { "input": [ "text" @@ -171871,27 +175996,26 @@ }, "limit": { "context": 131072, - "output": 16384 + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.1, - "output": 0.3 + "input": 0.7989999999999999, + "output": 1.394 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "aion-labs/aion-2.0", + "name": "AionLabs: Aion-2.0", + "display_name": "AionLabs: Aion-2.0", "modalities": { "input": [ "text" @@ -171901,28 +176025,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 131072, + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "open_weights": false, + "release_date": "2026-02-23", + "last_updated": "2026-02-23", "cost": { - "input": 0.27, - "output": 1 + "input": 0.8, + "output": 1.6 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "aion-labs/aion-1.0", + "name": "Aion 1.0", + "display_name": "Aion 1.0", "modalities": { "input": [ "text" @@ -171932,33 +176055,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 65536, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - 
"release_date": "2025-12-03", - "last_updated": "2025-12-03", + "open_weights": false, + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 0.26, - "output": 0.38 + "input": 3.995, + "output": 7.99 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3-0324", - "name": "DeepSeek V3 0324", - "display_name": "DeepSeek V3 0324", + "id": "pamanseau/OpenReasoning-Nemotron-32B", + "name": "OpenReasoning Nemotron 32B", + "display_name": "OpenReasoning Nemotron 32B", "modalities": { "input": [ "text" @@ -171968,28 +176085,28 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 32768, + "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "open_weights": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0.25, - "output": 0.88 + "input": 0.1, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-Exp", - "name": "DeepSeek V3.2 Exp", - "display_name": "DeepSeek V3.2 Exp", + "id": "LatitudeGames/Wayfarer-Large-70B-Llama-3.3", + "name": "Llama 3.3 70B Wayfarer", + "display_name": "Llama 3.3 70B Wayfarer", "modalities": { "input": [ "text" @@ -171999,28 +176116,27 @@ ] }, "limit": { - "context": 164000, - "output": 164000 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-10", - "last_updated": "2025-10-10", + "open_weights": false, + "release_date": "2025-02-20", + "last_updated": "2025-02-20", "cost": { - "input": 0.27, - "output": 0.4 + "input": 0.700000007, + "output": 0.700000007 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-0528", - "name": "DeepSeek R1 0528", - 
"display_name": "DeepSeek R1 0528", + "id": "baseten/Kimi-K2-Instruct-FP4", + "name": "Kimi K2 0711 Instruct FP4", + "display_name": "Kimi K2 0711 Instruct FP4", "modalities": { "input": [ "text" @@ -172030,88 +176146,57 @@ ] }, "limit": { - "context": 163840, - "output": 64000 + "context": 128000, + "output": 131072 }, - "temperature": true, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-07", - "release_date": "2025-05-28", - "last_updated": "2025-05-28", + "open_weights": false, + "release_date": "2025-07-11", + "last_updated": "2025-07-11", "cost": { - "input": 0.5, - "output": 2.15 + "input": 0.1, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-Plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "inflection/inflection-3-pi", + "name": "Inflection 3 Pi", + "display_name": "Inflection 3 Pi", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02", - "last_updated": "2026-02", + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.4, - "output": 2.4, - "reasoning": 2.4 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": 
"Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "inflection/inflection-3-productivity", + "name": "Inflection 3 Productivity", + "display_name": "Inflection 3 Productivity", "modalities": { "input": [ "text" @@ -172121,32 +176206,30 @@ ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 8000, + "output": 4096 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "open_weights": false, + "release_date": "2024-10-11", + "last_updated": "2024-10-11", "cost": { - "input": 0.09, - "output": 0.6 + "input": 2.499, + "output": 9.996 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-32B-Instruct", - "name": "Qwen2.5 VL 32B Instruct", - "display_name": "Qwen2.5 VL 32B Instruct", + "id": "ReadyArt/MS3.2-The-Omega-Directive-24B-Unslop-v2.0", + "name": "Omega Directive 24B Unslop v2.0", + "display_name": "Omega Directive 24B Unslop v2.0", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -172154,100 +176237,56 @@ }, "limit": { "context": 16384, - "output": 16384 + "output": 32768 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "release_date": "2025-03-24", - "last_updated": "2025-03-24", + "attachment": false, + "open_weights": false, + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.5, + "output": 0.5 }, "type": "chat" - } - ] - }, - "opencode": { - "id": "opencode", - "name": "OpenCode Zen", - "display_name": "OpenCode Zen", - "api": "https://opencode.ai/zen/v1", - "doc": "https://opencode.ai/docs/zen", - "models": [ + }, { - "id": "claude-opus-4-5", - "name": "Claude Opus 4.5", - "display_name": "Claude Opus 
4.5", + "id": "MiniMaxAI/MiniMax-M1-80k", + "name": "MiniMax M1 80K", + "display_name": "MiniMax M1 80K", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1000000, + "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-11-24", - "last_updated": "2025-11-24", + "release_date": "2025-06-16", + "last_updated": "2025-06-16", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.6052, + "output": 2.4225000000000003 }, "type": "chat" }, { - "id": "mimo-v2-flash-free", - "name": "MiMo V2 Flash Free", - "display_name": "MiMo V2 Flash Free", + "id": "upstage/solar-pro-3", + "name": "Solar Pro 3", + "display_name": "Solar Pro 3", "modalities": { "input": [ "text" @@ -172257,197 +176296,101 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 128000 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": 
true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "open_weights": false, + "release_date": "2026-03-03", + "last_updated": "2026-03-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.15, + "output": 0.6, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "claude-sonnet-4", - "name": "Claude Sonnet 4", - "display_name": "Claude Sonnet 4", + "id": "allenai/olmo-3-32b-think", + "name": "Olmo 3 32B Think", + "display_name": "Olmo 3 32B Think", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-05-22", - "last_updated": "2025-05-22", - "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "release_date": "2025-11-01", + "last_updated": "2025-11-01", + "cost": { + "input": 0.3, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "claude-sonnet-4-6", - "name": "Claude Sonnet 4.6", - "display_name": "Claude Sonnet 4.6", + "id": "essentialai/rnj-1-instruct", + "name": "RNJ-1 Instruct 8B", + "display_name": "RNJ-1 Instruct 8B", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." 
- ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "release_date": "2025-12-13", + "last_updated": "2025-12-13", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75 + "input": 0.15, + "output": 0.15 }, "type": "chat" }, { - "id": "grok-build-0.1", - "name": "Grok Build 0.1", - "display_name": "Grok Build 0.1", + "id": "deepseek/deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 1048576, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -172455,137 +176398,94 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-20", - "last_updated": "2026-05-20", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1, - "output": 2, - "cache_read": 0.2 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "deepseek/deepseek-v4-flash:thinking", + "name": "DeepSeek V4 Flash (Thinking)", + "display_name": "DeepSeek V4 Flash (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 384000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - 
"mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "gpt-5-codex", - "name": "GPT-5 Codex", - "display_name": "GPT-5 Codex", + "id": "deepseek/deepseek-v4-pro-cheaper:thinking", + "name": "DeepSeek V4 Pro Cheaper (Thinking)", + "display_name": "DeepSeek V4 Pro Cheaper (Thinking)", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 1048576, + "output": 384000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "hy3-preview-free", - "name": "Hy3 preview Free", - "display_name": "Hy3 preview Free", + "id": "deepseek/deepseek-prover-v2-671b", + "name": "DeepSeek Prover v2 
671B", + "display_name": "DeepSeek Prover v2 671B", "modalities": { "input": [ "text" @@ -172595,36 +176495,27 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 160000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "open_weights": false, + "release_date": "2025-04-30", + "last_updated": "2025-04-30", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1, + "output": 2.5 }, "type": "chat" }, { - "id": "glm-4.6", - "name": "GLM-4.6", - "display_name": "GLM-4.6", + "id": "deepseek/deepseek-latest", + "name": "DeepSeek Latest", + "display_name": "DeepSeek Latest", "modalities": { "input": [ "text" @@ -172634,36 +176525,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1048576, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-09-30", - "last_updated": "2025-09-30", + "open_weights": false, + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": { - "input": 0.6, + "input": 1.1, "output": 2.2, - "cache_read": 0.1 + "cache_read": 0.11 }, "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": "Kimi K2 Thinking", - "display_name": "Kimi K2 Thinking", + "id": "deepseek/deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -172673,10 +176557,9 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 1048576, + "output": 384000 }, - "temperature": true, 
"tool_call": true, "reasoning": { "supported": true, @@ -172694,28 +176577,23 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "open_weights": false, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 1.1, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "display_name": "Gemini 3 Pro", + "id": "deepseek/deepseek-v4-pro:thinking", + "name": "DeepSeek V4 Pro (Thinking)", + "display_name": "DeepSeek V4 Pro (Thinking)", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" @@ -172723,181 +176601,95 @@ }, "limit": { "context": 1048576, - "output": 65536 + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-11-18", - "last_updated": "2025-11-18", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.1, + "output": 2.2, + "cache_read": 0.11 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": "deepseek/deepseek-v3.2-speciale", + "name": "DeepSeek V3.2 Speciale", + "display_name": "DeepSeek V3.2 
Speciale", "modalities": { "input": [ "text", - "image" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163000, + "output": 65536 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2025-12-02", + "last_updated": "2025-12-02", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "claude-haiku-4-5", - "name": "Claude Haiku 4.5", - "display_name": "Claude Haiku 4.5", + "id": "deepseek/deepseek-v4-pro-cheaper", + "name": "DeepSeek V4 Pro Cheaper", + "display_name": "DeepSeek V4 Pro Cheaper", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 64000 + "context": 1048576, + "output": 384000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
- ] - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-02-28", - "release_date": "2025-10-15", - "last_updated": "2025-10-15", + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 1, - "output": 5, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.435, + "output": 0.87, + "cache_read": 0.003625 }, "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "deepseek/deepseek-v3.2:thinking", + "name": "DeepSeek V3.2 Thinking", + "display_name": "DeepSeek V3.2 Thinking", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -172905,55 +176697,31 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 163000, + "output": 65536 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "deepseek/deepseek-v3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ "text", - "image", "pdf" ], "output": [ @@ -172961,117 +176729,65 @@ ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 163000, + "output": 65536 }, - "temperature": false, "tool_call": true, "reasoning": { - 
"supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.27999999999999997, + "output": 0.42000000000000004 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "minimax/minimax-m3:thinking", + "name": "MiniMax M3 Thinking", + "display_name": "MiniMax M3 Thinking", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 512000, + "output": 80000 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 0.2, + "input": 0.3, "output": 1.2, - "cache_read": 0.02, - "cache_write": 0.25 + "cache_read": 0.06 }, "type": "chat" }, { - "id": "minimax-m2.1", - 
"name": "MiniMax M2.1", - "display_name": "MiniMax M2.1", + "id": "minimax/minimax-m2.5", + "name": "MiniMax M2.5", + "display_name": "MiniMax M2.5", "modalities": { "input": [ "text" @@ -173084,7 +176800,6 @@ "context": 204800, "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -173092,46 +176807,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { "input": 0.3, - "output": 1.2, - "cache_read": 0.1 + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "minimax/minimax-m2.1", + "name": "MiniMax M2.1", + "display_name": "MiniMax M2.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 200000, + "output": 131072 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -173139,149 +176843,85 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "release_date": "2025-12-19", + "last_updated": "2025-12-19", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 
45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.33, + "output": 1.32 }, "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "minimax/minimax-m2.7-turbo", + "name": "MiniMax M2.7 Turbo", + "display_name": "MiniMax M2.7 Turbo", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "attachment": false, + "open_weights": false, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.6, + "output": 2.4 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "minimax/minimax-01", + "name": "MiniMax 01", + "display_name": "MiniMax 01", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 1000192, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": 
"2025-12-22", - "last_updated": "2025-12-22", + "attachment": true, + "open_weights": false, + "release_date": "2025-01-15", + "last_updated": "2025-01-15", "cost": { - "input": 0.6, - "output": 2.2, - "cache_read": 0.1 + "input": 0.1394, + "output": 1.1219999999999999 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "minimax/minimax-m3", + "name": "MiniMax M3", + "display_name": "MiniMax M3", "modalities": { "input": [ "text", @@ -173292,52 +176932,63 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512000, + "output": 80000 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": false + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "minimax/minimax-m2-her", + "name": "MiniMax M2-her", + "display_name": "MiniMax M2-her", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 65532, + "output": 2048 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-01-24", + "last_updated": "2026-01-24", + "cost": { + "input": 0.30200000000000005, + "output": 1.2069999999999999 + }, + "type": "chat" + }, + { + 
"id": "minimax/minimax-latest", + "name": "MiniMax Latest", + "display_name": "MiniMax Latest", "modalities": { "input": [ "text", @@ -173348,238 +176999,173 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 512000, + "output": 80000 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } - }, "attachment": true, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-05-03", + "last_updated": "2026-05-03", "cost": { - "input": 0.05, - "output": 0.4, - "cache_read": 0.005 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "claude-opus-4-1", - "name": "Claude Opus 4.1", - "display_name": "Claude Opus 4.1", + "id": "minimax/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-03-31", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 15, - "output": 75, - "cache_read": 1.5, - "cache_write": 18.75 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "kwaipilot/kat-coder-pro-v2", + "name": "KAT Coder Pro V2", + "display_name": "KAT Coder Pro V2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 256000, + "output": 80000 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2026-03-28", + "last_updated": "2026-03-28", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex Mini", - "display_name": "GPT-5.1 Codex Mini", + "id": "mlabonne/NeuralDaredevil-8B-abliterated", + "name": "Neural Daredevil 8B abliterated", + "display_name": "Neural Daredevil 8B abliterated", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 8192, + "output": 8192 }, - 
"temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": false, + "release_date": "2024-12-01", + "last_updated": "2024-12-01", + "cost": { + "input": 0.44, + "output": 0.44 }, - "attachment": true, + "type": "chat" + }, + { + "id": "VongolaChouko/Starcannon-Unleashed-12B-v1.0", + "name": "Mistral Nemo Starcannon 12b v1", + "display_name": "Mistral Nemo Starcannon 12b v1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-07-01", + "last_updated": "2024-07-01", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "mimo-v2-omni-free", - "name": "MiMo V2 Omni Free", - "display_name": "MiMo V2 Omni Free", + "id": "TEE/minimax-m2.5", + "name": "MiniMax M2.5 TEE", + "display_name": "MiniMax M2.5 TEE", "modalities": { "input": [ - "text", - "image", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 64000 + "context": 196608, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -173587,31 +177173,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - 
"continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.2, + "output": 1.38 }, "type": "chat" }, { - "id": "ring-2.6-1t-free", - "name": "Ring 2.6 1T Free", - "display_name": "Ring 2.6 1T Free", + "id": "TEE/glm-4.7", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ "text" @@ -173621,14 +177199,12 @@ ] }, "limit": { - "context": 262000, - "output": 66000 + "context": 131000, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -173642,20 +177218,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-05-08", - "last_updated": "2026-05-08", + "open_weights": false, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", "cost": { - "input": 0, - "output": 0 + "input": 0.85, + "output": 3.3 }, "type": "chat" }, { - "id": "nemotron-3-ultra-free", - "name": "Nemotron 3 Ultra Free", - "display_name": "Nemotron 3 Ultra Free", + "id": "TEE/llama3-3-70b", + "name": "Llama 3.3 70B", + "display_name": "Llama 3.3 70B", "modalities": { "input": [ "text" @@ -173665,42 +177240,27 @@ ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 128000, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, 
"attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "open_weights": false, + "release_date": "2025-07-03", + "last_updated": "2025-07-03", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "trinity-large-preview-free", - "name": "Trinity Large Preview", - "display_name": "Trinity Large Preview", + "id": "TEE/gemma-4-31b-it", + "name": "Gemma 4 31B IT TEE", + "display_name": "Gemma 4 31B IT TEE", "modalities": { "input": [ "text" @@ -173710,164 +177270,106 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-01-28", - "last_updated": "2026-01-28", + "open_weights": false, + "release_date": "2026-05-26", + "last_updated": "2026-05-26", "cost": { - "input": 0, - "output": 0 + "input": 0.15, + "output": 0.46 }, "type": "chat" }, { - "id": "claude-fable-5", - "name": "Claude Fable 5", - "display_name": "Claude Fable 5", + "id": "TEE/qwen3-30b-a3b-instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507 TEE", + "display_name": "Qwen3 30B A3B Instruct 2507 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262000, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - 
"thinking_blocks" - ], - "notes": [ - "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", - "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", - "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "release_date": "2025-07-29", + "last_updated": "2025-07-29", "cost": { - "input": 10, - "output": 50, - "cache_read": 1, - "cache_write": 12.5 + "input": 0.15, + "output": 0.44999999999999996 }, "type": "chat" }, { - "id": "gemini-3-flash", - "name": "Gemini 3 Flash", - "display_name": "Gemini 3 Flash", + "id": "TEE/glm-5.1", + "name": "GLM 5.1 TEE", + "display_name": "GLM 5.1 TEE", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 202752, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05 + "input": 1.5, + "output": 5.25, + "cache_read": 0.3 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 
Plus", - "display_name": "Qwen3.6 Plus", + "id": "TEE/deepseek-v4-pro", + "name": "DeepSeek V4 Pro TEE", + "display_name": "DeepSeek V4 Pro TEE", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, + "context": 800000, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -173884,222 +177386,156 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 0.5, - "output": 3, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 1.5, + "output": 5.25, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "mimo-v2.5-free", - "name": "MiMo V2.5 Free", - "display_name": "MiMo V2.5 Free", + "id": "TEE/deepseek-v4-pro:thinking", + "name": "DeepSeek V4 Pro Thinking TEE", + "display_name": "DeepSeek V4 Pro Thinking TEE", "modalities": { "input": [ - "text", - "image", - "audio", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 800000, + "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": false, + "open_weights": false, + "release_date": "2026-04-29", + "last_updated": "2026-04-29", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.5, + "output": 5.25, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 Nano", - "display_name": "GPT-5.4 Nano", + "id": 
"TEE/gemma4-31b:thinking", + "name": "Gemma 4 31B Thinking TEE", + "display_name": "Gemma 4 31B Thinking TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "release_date": "2026-05-02", + "last_updated": "2026-05-02", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 0.45, + "output": 1 }, "type": "chat" }, { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "display_name": "Claude Haiku 3.5", + "id": "TEE/kimi-k2.5", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 8192 + "context": 128000, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": false + "supported": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2024-07-31", - "release_date": "2024-10-22", - "last_updated": "2024-10-22", + "release_date": "2026-01-29", + 
"last_updated": "2026-01-29", "cost": { - "input": 0.8, - "output": 4, - "cache_read": 0.08, - "cache_write": 1 + "input": 0.3, + "output": 1.9 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "TEE/qwen2.5-vl-72b-instruct", + "name": "Qwen2.5 VL 72B TEE", + "display_name": "Qwen2.5 VL 72B TEE", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 65536, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-24", - "last_updated": "2026-02-24", + "release_date": "2025-02-01", + "last_updated": "2025-02-01", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "TEE/gpt-oss-120b", + "name": "GPT-OSS 120B TEE", + "display_name": "GPT-OSS 120B TEE", "modalities": { "input": [ "text" @@ -174109,52 +177545,32 @@ ] }, "limit": { - "context": 128000, - "output": 128000 + "context": 131072, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - 
"medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, "attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "qwen3.6-plus-free", - "name": "Qwen3.6 Plus Free", - "display_name": "Qwen3.6 Plus Free", + "id": "TEE/qwen3.5-27b", + "name": "Qwen3.5 27B TEE", + "display_name": "Qwen3.5 27B TEE", "modalities": { "input": [ "text", @@ -174169,11 +177585,9 @@ "context": 262144, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -174188,61 +177602,49 @@ }, "attachment": true, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "release_date": "2026-03-13", + "last_updated": "2026-03-13", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 2.4 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "TEE/gemma-4-26b-a4b-uncensored", + "name": "Gemma 4 26B A4B Uncensored TEE", + "display_name": "Gemma 4 26B A4B Uncensored TEE", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 65536, + "output": 65536 }, - "temperature": false, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": true, "open_weights": false, - "knowledge": "2025-12-01", - "release_date": 
"2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-05-23", + "last_updated": "2026-05-23", "cost": { - "input": 30, - "output": 180, - "cache_read": 30 + "input": 0.15, + "output": 0.7 }, "type": "chat" }, { - "id": "minimax-m2.1-free", - "name": "MiniMax M2.1 Free", - "display_name": "MiniMax M2.1 Free", + "id": "TEE/deepseek-v3.1", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ "text" @@ -174252,165 +177654,105 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 164000, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-23", - "last_updated": "2025-12-23", + "open_weights": false, + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1, + "output": 2.5 }, "type": "chat" }, { - "id": "gemini-3.1-pro", - "name": "Gemini 3.1 Pro Preview", - "display_name": "Gemini 3.1 Pro Preview", + "id": "TEE/kimi-k2.6", + "name": "Kimi K2.6 TEE", + "display_name": "Kimi K2.6 TEE", "modalities": { "input": [ "text", - "image", - "video", - "audio", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 262144, "output": 65536 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "low", - "high" - ], - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] + "supported": true } }, "attachment": true, "open_weights": false, - "knowledge": "2025-01", - 
"release_date": "2026-02-19", - "last_updated": "2026-02-19", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 2, - "output": 12, - "cache_read": 0.2, - "tiers": [ - { - "input": 4, - "output": 18, - "cache_read": 0.4, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 4, - "output": 18, - "cache_read": 0.4 - } + "input": 1.5, + "output": 5.25, + "cache_read": 0.375 }, "type": "chat" }, { - "id": "gemini-3.5-flash", - "name": "Gemini 3.5 Flash", - "display_name": "Gemini 3.5 Flash", + "id": "TEE/qwen3.5-397b-a17b", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", "modalities": { "input": [ - "text", - "image", - "video", - "audio", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 258048, "output": 65536 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "level", - "level": "high", - "level_options": [ - "minimal", - "low", - "medium", - "high" - ], + "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ - "thought_signatures" + "thinking_blocks" ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2026-05-19", - "last_updated": "2026-05-19", + "release_date": "2026-02-28", + "last_updated": "2026-02-28", "cost": { - "input": 1.5, - "output": 9, - "cache_read": 0.15, - "input_audio": 1.5 + "input": 0.6, + "output": 3.6 }, "type": "chat" }, { - "id": "deepseek-v4-flash-free", - "name": "DeepSeek V4 Flash Free", - "display_name": "DeepSeek V4 Flash Free", + "id": "TEE/kimi-k2.5-thinking", + "name": "Kimi K2.5 Thinking TEE", + "display_name": "Kimi K2.5 Thinking TEE", "modalities": { "input": [ "text" @@ -174420,10 +177762,41 @@ ] }, 
"limit": { - "context": 200000, - "output": 128000 + "context": 128000, + "output": 65535 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-01-29", + "last_updated": "2026-01-29", + "cost": { + "input": 0.3, + "output": 1.9 + }, + "type": "chat" + }, + { + "id": "TEE/qwen3.6-35b-a3b-uncensored", + "name": "Qwen3.6 35B A3B Uncensored TEE", + "display_name": "Qwen3.6 35B A3B Uncensored TEE", + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -174440,79 +177813,55 @@ ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "attachment": true, + "open_weights": false, + "release_date": "2026-05-23", + "last_updated": "2026-05-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.3, + "output": 1.5 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "TEE/glm-4.7-flash", + "name": "GLM 4.7 Flash TEE", + "display_name": "GLM 4.7 Flash TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 203000, + "output": 65535 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, + 
"attachment": false, "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-01-14", - "last_updated": "2026-01-14", + "release_date": "2026-01-19", + "last_updated": "2026-01-19", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.15, + "output": 0.5 }, "type": "chat" }, { - "id": "minimax-m2.7", - "name": "MiniMax M2.7", - "display_name": "MiniMax M2.7", + "id": "TEE/gemma4-31b", + "name": "Gemma 4 31B", + "display_name": "Gemma 4 31B", "modalities": { "input": [ "text" @@ -174522,42 +177871,57 @@ ] }, "limit": { - "context": 204800, + "context": 262144, "output": 131072 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "attachment": false, + "open_weights": false, + "release_date": "2026-04-04", + "last_updated": "2026-04-04", + "cost": { + "input": 0.45, + "output": 1 + }, + "type": "chat" + }, + { + "id": "TEE/gemma-3-27b-it", + "name": "Gemma 3 27B TEE", + "display_name": "Gemma 3 27B TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 131072, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "open_weights": false, + "release_date": "2025-03-10", + "last_updated": "2025-03-10", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "TEE/gpt-oss-20b", + "name": "GPT-OSS 20B TEE", + "display_name": "GPT-OSS 20B TEE", "modalities": { "input": [ 
"text" @@ -174567,61 +177931,47 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 131072, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "open_weights": false, + "release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.14, - "output": 0.28, - "cache_read": 0.03 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "kimi-k2.5-free", - "name": "Kimi K2.5 Free", - "display_name": "Kimi K2.5 Free", + "id": "TEE/glm-5", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 203000, + "output": 65535 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -174634,84 +177984,87 @@ ] } }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "attachment": false, + "open_weights": false, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 1.2, + "output": 3.5 }, "type": "chat" }, { - "id": "claude-opus-4-8", - "name": "Claude Opus 4.8", - "display_name": "Claude Opus 4.8", + "id": "TEE/glm-5.1-thinking", + "name": "GLM 5.1 Thinking TEE", + "display_name": "GLM 5.1 Thinking TEE", "modalities": { "input": [ - "text", - "image", 
- "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202752, + "output": 65535 }, - "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true + }, + "attachment": false, + "open_weights": false, + "release_date": "2026-04-20", + "last_updated": "2026-04-20", + "cost": { + "input": 1.5, + "output": 5.25, + "cache_read": 0.3 + }, + "type": "chat" + }, + { + "id": "TEE/deepseek-v3.2", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 164000, + "output": 65536 + }, + "tool_call": false, + "reasoning": { + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], - "interleaved": true, - "summaries": true, - "visibility": "omitted", - "continuation": [ - "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." 
- ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-05-28", - "last_updated": "2026-05-28", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.5, + "output": 1 }, "type": "chat" }, { - "id": "nemotron-3-super-free", - "name": "Nemotron 3 Super Free", - "display_name": "Nemotron 3 Super Free", + "id": "TEE/qwen3.5-122b-a10b", + "name": "Qwen3.5 122B A10B TEE", + "display_name": "Qwen3.5 122B A10B TEE", "modalities": { "input": [ "text" @@ -174721,10 +178074,9 @@ ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -174742,21 +178094,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "open_weights": false, + "release_date": "2026-05-26", + "last_updated": "2026-05-26", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.46, + "output": 3.68 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "Sao10K/L3.1-70B-Hanami-x1", + "name": "Llama 3.1 70B Hanami", + "display_name": "Llama 3.1 70B Hanami", "modalities": { "input": [ "text" @@ -174766,98 +178116,57 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + 
"open_weights": false, + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.2 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "Sao10K/L3-8B-Stheno-v3.2", + "name": "Sao10K Stheno 8b", + "display_name": "Sao10K Stheno 8b", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 8192 }, - "temperature": false, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "release_date": "2024-11-29", + "last_updated": "2024-11-29", "cost": { - "input": 1.07, - "output": 8.5, - "cache_read": 0.107 + "input": 0.2006, + "output": 0.2006 }, "type": "chat" }, { - "id": "qwen3-coder", - "name": "Qwen3 Coder", - "display_name": "Qwen3 Coder", + "id": "Sao10K/L3.3-70B-Euryale-v2.3", + "name": "Llama 3.3 70B Euryale", + "display_name": "Llama 3.3 70B Euryale", "modalities": { "input": [ "text" @@ -174867,29 +178176,27 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 20480, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": 
"2025-07-23", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0.45, - "output": 1.8 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "big-pickle", - "name": "Big Pickle", - "display_name": "Big Pickle", + "id": "Sao10K/L3.1-70B-Euryale-v2.2", + "name": "Llama 3.1 70B Euryale", + "display_name": "Llama 3.1 70B Euryale", "modalities": { "input": [ "text" @@ -174899,43 +178206,27 @@ ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 20480, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": false, - "knowledge": "2025-01", - "release_date": "2025-10-17", - "last_updated": "2025-10-17", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.306, + "output": 0.357 }, "type": "chat" }, { - "id": "ling-2.6-flash-free", - "name": "Ling 2.6 Flash Free", - "display_name": "Ling 2.6 Flash Free", + "id": "Steelskull/L3.3-MS-Evalebis-70b", + "name": "MS Evalebis 70b", + "display_name": "MS Evalebis 70b", "modalities": { "input": [ "text" @@ -174945,70 +178236,57 @@ ] }, "limit": { - "context": 262100, - "output": 32800 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-06", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0 + 
"input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "minimax-m3-free", - "name": "MiniMax M3 Free", - "display_name": "MiniMax M3 Free", + "id": "Steelskull/L3.3-MS-Nevoria-70b", + "name": "Steelskull Nevoria 70b", + "display_name": "Steelskull Nevoria 70b", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 32000 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-05-31", - "last_updated": "2026-05-31", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "Steelskull/L3.3-Cu-Mai-R1-70b", + "name": "Llama 3.3 70B Cu Mai", + "display_name": "Llama 3.3 70B Cu Mai", "modalities": { "input": [ "text" @@ -175018,42 +178296,27 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - 
"input": 0.3, - "output": 1.2, - "cache_read": 0.06 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "glm-4.7-free", - "name": "GLM-4.7 Free", - "display_name": "GLM-4.7 Free", + "id": "Steelskull/L3.3-MS-Evayale-70B", + "name": "Evayale 70b ", + "display_name": "Evayale 70b ", "modalities": { "input": [ "text" @@ -175063,176 +178326,133 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "claude-sonnet-4-5", - "name": "Claude Sonnet 4.5", - "display_name": "Claude Sonnet 4.5", + "id": "Steelskull/L3.3-Nevoria-R1-70b", + "name": "Steelskull Nevoria R1 70b", + "display_name": "Steelskull Nevoria R1 70b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 16384, + "output": 16384 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "budget", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" 
- ], - "notes": [ - "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", - "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2025-07-31", - "release_date": "2025-09-29", - "last_updated": "2025-09-29", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 3, - "output": 15, - "cache_read": 0.3, - "cache_write": 3.75, - "tiers": [ - { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5, - "tier": { - "type": "context", - "size": 200000 - } - } - ], - "context_over_200k": { - "input": 6, - "output": 22.5, - "cache_read": 0.6, - "cache_write": 7.5 - } + "input": 0.49299999999999994, + "output": 0.49299999999999994 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 Mini", - "display_name": "GPT-5.4 Mini", + "id": "Steelskull/L3.3-Electra-R1-70b", + "name": "Steelskull Electra R1 70b", + "display_name": "Steelskull Electra R1 70b", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16384, + "output": 16384 }, - "temperature": false, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": false, + "release_date": "2024-12-06", + "last_updated": "2024-12-06", + "cost": { + "input": 0.69989, + "output": 0.69989 + }, + "type": "chat" + } + ] + }, + "moark": { + "id": "moark", + "name": "Moark", + "display_name": "Moark", + "api": "https://moark.com/v1", + "doc": "https://moark.com/docs/openapi/v1#tag/%E6%96%87%E6%9C%AC%E7%94%9F%E6%88%90", + "models": [ + { + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 
131072 + }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.75, - "output": 4.5, - "cache_read": 0.075 + "input": 2.1, + "output": 8.4 }, "type": "chat" }, { - "id": "mimo-v2-pro-free", - "name": "MiMo V2 Pro Free", - "display_name": "MiMo V2 Pro Free", + "id": "GLM-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ "text" @@ -175242,8 +178462,8 @@ ] }, "limit": { - "context": 1048576, - "output": 64000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -175262,87 +178482,76 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 3.5, + "output": 14 }, "type": "chat" - }, + } + ] + }, + "lilac": { + "id": "lilac", + "name": "Lilac", + "display_name": "Lilac", + "api": "https://api.getlilac.com/v1", + "doc": "https://docs.getlilac.com/inference/models", + "models": [ { - "id": "claude-opus-4-6", - "name": "Claude Opus 4.6", - "display_name": "Claude Opus 4.6", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { 
"input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "mixed", - "budget": { - "min": 1024, - "unit": "tokens" - }, - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "max" - ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", - "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-05-31", - "release_date": "2026-02-05", - "last_updated": "2026-03-13", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.7, + "output": 3.5, + "cache_read": 0.2 }, "type": "chat" }, { - "id": "kimi-k2", - "name": "Kimi K2", - "display_name": "Kimi K2", + "id": "minimaxai/minimax-m2.7", + "name": "MiniMax M2.7", + "display_name": "MiniMax M2.7", "modalities": { "input": [ "text" @@ -175352,30 +178561,42 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 204800 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - 
"release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-01", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 0.4, - "output": 2.5, - "cache_read": 0.4 + "input": 0.3, + "output": 1.2, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "google/gemma-4-31b-it", + "name": "Gemma 4 31B IT", + "display_name": "Gemma 4 31B IT", "modalities": { "input": [ "text", @@ -175387,8 +178608,8 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 262100, + "output": 262100 }, "temperature": true, "tool_call": true, @@ -175409,94 +178630,85 @@ }, "attachment": true, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "knowledge": "2025-01", + "release_date": "2026-04-02", + "last_updated": "2026-04-02", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.08 + "input": 0.11, + "output": 0.35 }, "type": "chat" }, { - "id": "claude-opus-4-7", - "name": "Claude Opus 4.7", - "display_name": "Claude Opus 4.7", + "id": "zai-org/glm-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 128000 + "context": 202800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "high", - "effort_options": [ - "low", - "medium", - "high", - "xhigh", - "max" - ], "interleaved": true, "summaries": true, - "visibility": "omitted", + "visibility": "summary", "continuation": [ "thinking_blocks" - ], - "notes": [ - "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", - 
"Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", - "task_budget is separate from thinking control and should not be treated as a thinking budget." ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2026-01-31", - "release_date": "2026-04-16", - "last_updated": "2026-04-16", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5, - "cache_write": 6.25 + "input": 0.9, + "output": 3, + "cache_read": 0.27 }, "type": "chat" - }, + } + ] + }, + "ambient": { + "id": "ambient", + "name": "Ambient", + "display_name": "Ambient", + "api": "https://api.ambient.xyz/v1", + "doc": "https://ambient.xyz", + "models": [ { - "id": "north-mini-code-free", - "name": "North Mini Code Free", - "display_name": "North Mini Code Free", + "id": "moonshotai/kimi-k2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -175515,19 +178727,21 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-09-23", - "release_date": "2026-06-09", - "last_updated": "2026-06-09", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0, - "output": 0 + "input": 0.95, + "output": 4, + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, { - "id": "glm-5.1", + "id": "zai-org/GLM-5.1-FP8", "name": "GLM-5.1", "display_name": "GLM-5.1", "modalities": { @@ -175539,7 +178753,7 @@ ] }, "limit": { - "context": 204800, + "context": 202752, "output": 131072 }, "temperature": true, @@ -175561,20 +178775,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - 
"release_date": "2026-04-07", - "last_updated": "2026-04-07", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { "input": 1.4, "output": 4.4, - "cache_read": 0.26 + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "upstage": { + "id": "upstage", + "name": "Upstage", + "display_name": "Upstage", + "api": "https://api.upstage.ai/v1/solar", + "doc": "https://developers.upstage.ai/docs/apis/chat", + "models": [ { - "id": "grok-code", - "name": "Grok Code Fast 1", - "display_name": "Grok Code Fast 1", + "id": "solar-pro2", + "name": "solar-pro2", + "display_name": "solar-pro2", "modalities": { "input": [ "text" @@ -175584,8 +178807,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 65536, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -175593,22 +178816,21 @@ "supported": true, "default": true }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-20", - "last_updated": "2025-08-20", + "knowledge": "2025-03", + "release_date": "2025-05-20", + "last_updated": "2025-05-20", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.25, + "output": 0.25 }, "type": "chat" }, { - "id": "minimax-m2.5-free", - "name": "MiniMax M2.5 Free", - "display_name": "MiniMax M2.5 Free", + "id": "solar-pro3", + "name": "solar-pro3", + "display_name": "solar-pro3", "modalities": { "input": [ "text" @@ -175618,8 +178840,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 131072, + "output": 8192 }, "temperature": true, "tool_call": true, @@ -175627,27 +178849,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "open_weights": false, + "knowledge": "2025-03", + "release_date": "2026-01", + "last_updated": 
"2026-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.25, + "output": 0.25 }, "type": "chat" }, { - "id": "glm-5-free", - "name": "GLM-5 Free", - "display_name": "GLM-5 Free", + "id": "solar-mini", + "name": "solar-mini", + "display_name": "solar-mini", "modalities": { "input": [ "text" @@ -175657,98 +178873,99 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "open_weights": false, + "knowledge": "2024-09", + "release_date": "2024-06-12", + "last_updated": "2025-04-22", "cost": { - "input": 0, - "output": 0, - "cache_read": 0 + "input": 0.15, + "output": 0.15 }, "type": "chat" } ] }, - "openai": { - "id": "openai", - "name": "OpenAI", - "display_name": "OpenAI", - "doc": "https://platform.openai.com/docs/models", + "zhipuai-coding-plan": { + "id": "zhipuai-coding-plan", + "name": "Zhipu AI Coding Plan", + "display_name": "Zhipu AI Coding Plan", + "api": "https://open.bigmodel.cn/api/coding/paas/v4", + "doc": "https://docs.bigmodel.cn/cn/coding-plan/overview", "models": [ { - "id": "gpt-4o-2024-08-06", - "name": "GPT-4o (2024-08-06)", - "display_name": "GPT-4o (2024-08-06)", + "id": "glm-5.1", + "name": "GLM-5.1", + "display_name": "GLM-5.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + 
"extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-08-06", - "last_updated": "2024-08-06", + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5-pro", - "name": "GPT-5 Pro", - "display_name": "GPT-5 Pro", + "id": "glm-5v-turbo", + "name": "GLM-5V-Turbo", + "display_name": "GLM-5V-Turbo", "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 272000 + "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -175757,47 +178974,43 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "fixed", - "effort": "high", - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-10-06", - "last_updated": "2025-10-06", + "release_date": "2026-04-01", + "last_updated": "2026-04-01", "cost": { - "input": 15, - "output": 120 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5-mini", - "name": "GPT-5 Mini", - "display_name": "GPT-5 Mini", + "id": "glm-5-turbo", + "name": "GLM-5-Turbo", + "display_name": "GLM-5-Turbo", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 
+ "context": 200000, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -175806,209 +179019,170 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "release_date": "2026-03-16", + "last_updated": "2026-03-16", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-image-1", - "name": "gpt-image-1", - "display_name": "gpt-image-1", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-04-24", - "last_updated": "2025-04-24", - "type": "imageGeneration" - }, - { - "id": "gpt-4o", - "name": "GPT-4o", - "display_name": "GPT-4o", + "id": "glm-4.5-air", + "name": "GLM-4.5-Air", + "display_name": "GLM-4.5-Air", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 98304 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - 
"last_updated": "2024-08-06", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-28", + "last_updated": "2025-07-28", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-5.2", - "name": "GPT-5.2", - "display_name": "GPT-5.2", + "id": "glm-4.6v", + "name": "GLM-4.6V", + "display_name": "GLM-4.6V", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 0.9 }, "type": "chat" }, { - "id": "gpt-5-chat-latest", - "name": "GPT-5 Chat (latest)", - "display_name": "GPT-5 Chat (latest)", + "id": "glm-4.7", + "name": "GLM-4.7", + "display_name": "GLM-4.7", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 204800, + "output": 131072 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": 
false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" - }, + } + ] + }, + "chutes": { + "id": "chutes", + "name": "Chutes", + "display_name": "Chutes", + "api": "https://llm.chutes.ai/v1", + "doc": "https://llm.chutes.ai/v1/models", + "models": [ { - "id": "gpt-5-codex", - "name": "GPT-5-Codex", - "display_name": "GPT-5-Codex", + "id": "moonshotai/Kimi-K2.6-TEE", + "name": "Kimi K2.6 TEE", + "display_name": "Kimi K2.6 TEE", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -176017,55 +179191,45 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-09-15", - "last_updated": "2025-09-15", + "attachment": true, + "open_weights": true, + "knowledge": "2025-12", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1.25, - 
"output": 10, - "cache_read": 0.125 + "input": 0.95, + "output": 4, + "cache_read": 0.475 }, "type": "chat" }, { - "id": "o3", - "name": "o3", - "display_name": "o3", + "id": "moonshotai/Kimi-K2.5-TEE", + "name": "Kimi K2.5 TEE", + "display_name": "Kimi K2.5 TEE", "modalities": { "input": [ "text", "image", - "pdf" + "video" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 262144, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -176074,33 +179238,30 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.44, + "output": 2, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "gpt-5.3-chat-latest", - "name": "GPT-5.3 Chat (latest)", - "display_name": "GPT-5.3 Chat (latest)", + "id": "google/gemma-4-31B-turbo-TEE", + "name": "gemma 4 31B turbo TEE", + "display_name": "gemma 4 31B turbo TEE", "modalities": { "input": [ "text", @@ -176111,30 +179272,30 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "open_weights": true, + "release_date": "2026-04-02", + "last_updated": 
"2026-04-02", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.13, + "output": 0.38, + "cache_read": 0.065 }, "type": "chat" }, { - "id": "text-embedding-3-small", - "name": "text-embedding-3-small", - "display_name": "text-embedding-3-small", + "id": "Qwen/Qwen3-32B-TEE", + "name": "Qwen3 32B TEE", + "display_name": "Qwen3 32B TEE", "modalities": { "input": [ "text" @@ -176144,29 +179305,31 @@ ] }, "limit": { - "context": 8191, - "output": 1536 + "context": 40960, + "output": 40960 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": "2025-04", "cost": { - "input": 0.02, - "output": 0 + "input": 0.08, + "output": 0.24, + "cache_read": 0.04 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-4o-2024-11-20", - "name": "GPT-4o (2024-11-20)", - "display_name": "GPT-4o (2024-11-20)", + "id": "Qwen/Qwen2.5-VL-32B-Instruct", + "name": "Qwen2.5 VL 32B Instruct", + "display_name": "Qwen2.5 VL 32B Instruct", "modalities": { "input": [ "text", @@ -176177,129 +179340,107 @@ ] }, "limit": { - "context": 128000, + "context": 16384, "output": 16384 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-11-20", - "last_updated": "2024-11-20", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 2.5, - "output": 10, - "cache_read": 1.25 + "input": 0.0543, + "output": 0.2174, + "cache_read": 0.02715 }, "type": "chat" }, { - "id": "gpt-5", - "name": "GPT-5", - "display_name": "GPT-5", + "id": 
"Qwen/Qwen3-Next-80B-A3B-Instruct", + "name": "Qwen3 Next 80B A3B Instruct", + "display_name": "Qwen3 Next 80B A3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.1, + "output": 0.8, + "cache_read": 0.05 }, "type": "chat" }, { - "id": "gpt-image-1-mini", - "name": "gpt-image-1-mini", - "display_name": "gpt-image-1-mini", + "id": "Qwen/Qwen3-235B-A22B-Instruct-2507-TEE", + "name": "Qwen3 235B A22B Instruct 2507 TEE", + "display_name": "Qwen3 235B A22B Instruct 2507 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 65536 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": false, - "release_date": "2025-09-26", - "last_updated": "2025-09-26", - "type": "imageGeneration" + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-04", + "last_updated": 
"2025-04", + "cost": { + "input": 0.1, + "output": 0.6, + "cache_read": 0.05 + }, + "type": "chat" }, { - "id": "gpt-5.4-pro", - "name": "GPT-5.4 Pro", - "display_name": "GPT-5.4 Pro", + "id": "Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 262144 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -176308,87 +179449,74 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-05", - "last_updated": "2026-03-05", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.11, + "output": 0.6, + "cache_read": 0.055 }, "type": "chat" }, { - "id": "gpt-4.1-mini", - "name": "GPT-4.1 mini", - "display_name": "GPT-4.1 mini", + "id": "Qwen/Qwen3.6-27B-TEE", + "name": "Qwen3.6 27B TEE", + "display_name": "Qwen3.6 27B TEE", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, 
"reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "open_weights": true, + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.4, - "output": 1.6, - "cache_read": 0.1 + "input": 0.195, + "output": 1.56, + "cache_read": 0.0975 }, "type": "chat" }, { - "id": "text-embedding-3-large", - "name": "text-embedding-3-large", - "display_name": "text-embedding-3-large", + "id": "Qwen/Qwen3Guard-Gen-0.6B", + "name": "Qwen3Guard Gen 0.6B", + "display_name": "Qwen3Guard Gen 0.6B", "modalities": { "input": [ "text" @@ -176398,254 +179526,170 @@ ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 32768, + "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2024-01", - "release_date": "2024-01-25", - "last_updated": "2024-01-25", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.13, - "output": 0 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, - "type": "embedding" + "type": "chat" }, { - "id": "gpt-5.2-pro", - "name": "GPT-5.2 Pro", - "display_name": "GPT-5.2 Pro", + "id": "Qwen/Qwen3-Coder-Next-TEE", + "name": "Qwen3 Coder Next TEE", + "display_name": "Qwen3 Coder Next TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "high", - "effort_options": [ - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 21, - "output": 168 + "input": 0.12, + "output": 0.75, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "o3-pro", - "name": "o3-pro", - "display_name": "o3-pro", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5 Coder 32B Instruct", + "display_name": "Qwen2.5 Coder 32B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-06-10", - "last_updated": "2025-06-10", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 20, - "output": 80 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "o4-mini", - "name": "o4-mini", - "display_name": "o4-mini", + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": "Qwen2.5 72B Instruct", + "display_name": 
"Qwen2.5 72B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 32768, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2025-04-16", - "last_updated": "2025-04-16", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.275 + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 }, "type": "chat" }, { - "id": "gpt-5.4", - "name": "GPT-5.4", - "display_name": "GPT-5.4", + "id": "Qwen/Qwen3.5-397B-A17B-TEE", + "name": "Qwen3.5 397B A17B TEE", + "display_name": "Qwen3.5 397B A17B TEE", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - 
"release_date": "2026-03-05", - "last_updated": "2026-03-05", + "open_weights": true, + "release_date": "2026-02-15", + "last_updated": "2026-02-15", "cost": { - "input": 2.5, - "output": 15, - "cache_read": 0.25, - "tiers": [ - { - "input": 5, - "output": 22.5, - "cache_read": 0.5, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 5, - "output": 22.5, - "cache_read": 0.5 - } + "input": 0.39, + "output": 2.34, + "cache_read": 0.195 }, "type": "chat" }, { - "id": "o3-mini", - "name": "o3-mini", - "display_name": "o3-mini", + "id": "Qwen/Qwen3-30B-A3B", + "name": "Qwen3 30B A3B", + "display_name": "Qwen3 30B A3B", "modalities": { "input": [ "text" @@ -176655,10 +179699,10 @@ ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 40960, + "output": 40960 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -176667,48 +179711,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-12-20", - "last_updated": "2025-01-29", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.1, - "output": 4.4, - "cache_read": 0.55 + "input": 0.06, + "output": 0.22, + "cache_read": 0.03 }, "type": "chat" }, { - "id": "gpt-5.5", - "name": "GPT-5.5", - "display_name": "GPT-5.5", + "id": "openai/gpt-oss-120b-TEE", + "name": "gpt oss 120b TEE", + "display_name": "gpt oss 120b TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 131072, + 
"output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -176717,267 +179755,236 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 5, - "output": 30, - "cache_read": 0.5, - "tiers": [ - { - "input": 10, - "output": 45, - "cache_read": 1, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 10, - "output": 45, - "cache_read": 1 - } + "input": 0.09, + "output": 0.36, + "cache_read": 0.045 }, "type": "chat" }, { - "id": "gpt-5.2-chat-latest", - "name": "GPT-5.2 Chat", - "display_name": "GPT-5.2 Chat", + "id": "XiaomiMiMo/MiMo-V2-Flash-TEE", + "name": "MiMo V2 Flash TEE", + "display_name": "MiMo V2 Flash TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 262144, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 
1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.09, + "output": 0.29, + "cache_read": 0.045 }, "type": "chat" }, { - "id": "gpt-5.1", - "name": "GPT-5.1", - "display_name": "GPT-5.1", + "id": "NousResearch/Hermes-4-14B", + "name": "Hermes 4 14B", + "display_name": "Hermes 4 14B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 40960, + "output": 40960 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.0136, + "output": 0.0543, + "cache_read": 0.0068 }, "type": "chat" }, { - "id": "gpt-5-nano", - "name": "GPT-5 Nano", - "display_name": "GPT-5 Nano", + "id": "NousResearch/DeepHermes-3-Mistral-24B-Preview", + "name": "DeepHermes 3 Mistral 24B Preview", + "display_name": "DeepHermes 3 Mistral 24B Preview", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 32768, + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, - 
"extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "minimal", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.0245, + "output": 0.0978, + "cache_read": 0.01225 }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05-30", - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "type": "chat" + }, + { + "id": "unsloth/Llama-3.2-1B-Instruct", + "name": "Llama 3.2 1B Instruct", + "display_name": "Llama 3.2 1B Instruct", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 16384, + "output": 8192 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 0.05, - "output": 0.4, + "input": 0.01, + "output": 0.0109, "cache_read": 0.005 }, "type": "chat" }, { - "id": "gpt-4o-mini", - "name": "GPT-4o mini", - "display_name": "GPT-4o mini", + "id": "unsloth/gemma-3-12b-it", + "name": "gemma 3 12b it", + "display_name": "gemma 3 12b it", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-07-18", - "last_updated": "2024-07-18", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + 
"input": 0.03, + "output": 0.1, + "cache_read": 0.015 }, "type": "chat" }, { - "id": "chatgpt-image-latest", - "name": "chatgpt-image-latest", - "display_name": "chatgpt-image-latest", + "id": "unsloth/gemma-3-4b-it", + "name": "gemma 3 4b it", + "display_name": "gemma 3 4b it", "modalities": { "input": [ "text", "image" ], "output": [ - "text", - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 96000, + "output": 96000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "release_date": "2025-12-16", - "last_updated": "2025-12-16", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", + "cost": { + "input": 0.01, + "output": 0.0272, + "cache_read": 0.005 + }, "type": "chat" }, { - "id": "gpt-5.1-codex-max", - "name": "GPT-5.1 Codex Max", - "display_name": "GPT-5.1 Codex Max", + "id": "unsloth/gemma-3-27b-it", + "name": "gemma 3 27b it", + "display_name": "gemma 3 27b it", "modalities": { "input": [ "text", @@ -176988,156 +179995,93 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.0272, + 
"output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "gpt-5.1-codex-mini", - "name": "GPT-5.1 Codex mini", - "display_name": "GPT-5.1 Codex mini", + "id": "unsloth/Mistral-Nemo-Instruct-2407", + "name": "Mistral Nemo Instruct 2407", + "display_name": "Mistral Nemo Instruct 2407", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": false - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.25, - "output": 2, - "cache_read": 0.025 + "input": 0.02, + "output": 0.04, + "cache_read": 0.01 }, "type": "chat" }, { - "id": "o1-pro", - "name": "o1-pro", - "display_name": "o1-pro", + "id": "unsloth/Llama-3.2-3B-Instruct", + "name": "Llama 3.2 3B Instruct", + "display_name": "Llama 3.2 3B Instruct", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 16384, + "output": 16384 }, - "temperature": false, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", 
- "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2025-03-19", - "last_updated": "2025-03-19", + "attachment": false, + "open_weights": true, + "release_date": "2025-02-12", + "last_updated": "2026-04-25", "cost": { - "input": 150, - "output": 600 + "input": 0.01, + "output": 0.0136, + "cache_read": 0.005 }, "type": "chat" }, { - "id": "text-embedding-ada-002", - "name": "text-embedding-ada-002", - "display_name": "text-embedding-ada-002", + "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE", + "name": "DeepSeek TNG R1T2 Chimera TEE", + "display_name": "DeepSeek TNG R1T2 Chimera TEE", "modalities": { "input": [ "text" @@ -177147,43 +180091,43 @@ ] }, "limit": { - "context": 8192, - "output": 1536 + "context": 163840, + "output": 163840 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "knowledge": "2022-12", - "release_date": "2022-12-15", - "last_updated": "2022-12-15", + "open_weights": true, + "release_date": "2026-04-25", + "last_updated": "2026-04-25", "cost": { - "input": 0.1, - "output": 0 + "input": 0.3, + "output": 1.1, + "cache_read": 0.15 }, - "type": "embedding" + "type": "chat" }, { - "id": "o3-deep-research", - "name": "o3-deep-research", - "display_name": "o3-deep-research", + "id": "zai-org/GLM-4.7-TEE", + "name": "GLM 4.7 TEE", + "display_name": "GLM 4.7 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177192,140 +180136,132 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": 
true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "attachment": false, + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 10, - "output": 40, - "cache_read": 2.5 + "input": 0.39, + "output": 1.75, + "cache_read": 0.195 }, "type": "chat" }, { - "id": "gpt-4.1", - "name": "GPT-4.1", - "display_name": "GPT-4.1", + "id": "zai-org/GLM-5-TEE", + "name": "GLM 5 TEE", + "display_name": "GLM 5 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 202752, + "output": 65535 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.95, + "output": 2.55, + "cache_read": 0.475 }, "type": "chat" }, { - "id": "gpt-5.4-nano", - "name": "GPT-5.4 nano", - "display_name": "GPT-5.4 nano", + "id": "zai-org/GLM-5.1-TEE", + "name": "GLM 5.1 TEE", + "display_name": "GLM 5.1 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 
128000 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-27", + "last_updated": "2026-03-27", "cost": { - "input": 0.2, - "output": 1.25, - "cache_read": 0.02 + "input": 1.05, + "output": 3.5, + "cache_read": 0.525 }, "type": "chat" }, { - "id": "gpt-5.3-codex", - "name": "GPT-5.3 Codex", - "display_name": "GPT-5.3 Codex", + "id": "zai-org/GLM-4.6V", + "name": "GLM 4.6V", + "display_name": "GLM 4.6V", "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177334,55 +180270,42 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - 
"release_date": "2026-02-05", - "last_updated": "2026-02-05", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.3, + "output": 0.9, + "cache_read": 0.15 }, "type": "chat" }, { - "id": "gpt-5.3-codex-spark", - "name": "GPT-5.3 Codex Spark", - "display_name": "GPT-5.3 Codex Spark", + "id": "zai-org/GLM-5-Turbo", + "name": "GLM 5 Turbo", + "display_name": "GLM 5 Turbo", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32000 + "context": 202752, + "output": 65535 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177391,108 +180314,75 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-03-11", + "last_updated": "2026-04-25", "cost": { - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.4891, + "output": 1.9565, + "cache_read": 0.24455 }, "type": "chat" }, { - "id": "gpt-5.5-pro", - "name": "GPT-5.5 Pro", - "display_name": "GPT-5.5 Pro", + "id": "zai-org/GLM-4.7-FP8", + "name": "GLM 4.7 FP8", + "display_name": "GLM 4.7 FP8", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1050000, - "output": 128000 + "context": 202752, + "output": 65535 }, - "temperature": 
false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-12-01", - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "attachment": false, + "open_weights": true, + "release_date": "2026-01-27", + "last_updated": "2026-04-25", "cost": { - "input": 30, - "output": 180, - "tiers": [ - { - "input": 60, - "output": 270, - "tier": { - "type": "context", - "size": 272000 - } - } - ], - "context_over_200k": { - "input": 60, - "output": 270 - } + "input": 0.2989, + "output": 1.1957, + "cache_read": 0.14945 }, "type": "chat" }, { - "id": "o4-mini-deep-research", - "name": "o4-mini-deep-research", - "display_name": "o4-mini-deep-research", + "id": "deepseek-ai/DeepSeek-V3.2-TEE", + "name": "DeepSeek V3.2 TEE", + "display_name": "DeepSeek V3.2 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 131072, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177501,33 +180391,29 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-05", - "release_date": "2024-06-26", - "last_updated": "2024-06-26", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 2, - "output": 8, - "cache_read": 0.5 + "input": 0.28, + "output": 0.42, + "cache_read": 0.14 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - 
"name": "GPT-3.5-turbo", - "display_name": "GPT-3.5-turbo", + "id": "deepseek-ai/DeepSeek-V3-0324-TEE", + "name": "DeepSeek V3 0324 TEE", + "display_name": "DeepSeek V3 0324 TEE", "modalities": { "input": [ "text" @@ -177537,45 +180423,42 @@ ] }, "limit": { - "context": 16385, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2021-09-01", - "release_date": "2023-03-01", - "last_updated": "2023-11-06", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 0.5, - "output": 1.5, - "cache_read": 0 + "input": 0.25, + "output": 1, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "gpt-5.2-codex", - "name": "GPT-5.2 Codex", - "display_name": "GPT-5.2 Codex", + "id": "deepseek-ai/DeepSeek-V3.1-TEE", + "name": "DeepSeek V3.1 TEE", + "display_name": "DeepSeek V3.1 TEE", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 163840, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177584,186 +180467,162 @@ "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2025-12-11", - "last_updated": "2025-12-11", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": 
{ - "input": 1.75, - "output": 14, - "cache_read": 0.175 + "input": 0.27, + "output": 1, + "cache_read": 0.135 }, "type": "chat" }, { - "id": "gpt-5.1-codex", - "name": "GPT-5.1 Codex", - "display_name": "GPT-5.1 Codex", + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "DeepSeek R1 Distill Llama 70B", + "display_name": "DeepSeek R1 Distill Llama 70B", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 131072, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "attachment": false, + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0.0272, + "output": 0.1087, + "cache_read": 0.0136 }, "type": "chat" }, { - "id": "gpt-4o-2024-05-13", - "name": "GPT-4o (2024-05-13)", - "display_name": "GPT-4o (2024-05-13)", + "id": "deepseek-ai/DeepSeek-R1-0528-TEE", + "name": "DeepSeek R1 0528 TEE", + "display_name": "DeepSeek R1 0528 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 163840, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": 
true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "knowledge": "2024-07", + "release_date": "2025-01-20", + "last_updated": "2025-05-29", "cost": { - "input": 5, - "output": 15 + "input": 0.45, + "output": 2.15, + "cache_read": 0.225 }, "type": "chat" }, { - "id": "gpt-5.4-mini", - "name": "GPT-5.4 mini", - "display_name": "GPT-5.4 mini", + "id": "MiniMaxAI/MiniMax-M2.5-TEE", + "name": "MiniMax M2.5 TEE", + "display_name": "MiniMax M2.5 TEE", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 196608, + "output": 65536 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": false + "default": true }, "extra_capabilities": { "reasoning": { "supported": true, - "default_enabled": false, - "mode": "effort", - "effort": "none", - "effort_options": [ - "none", - "low", - "medium", - "high", - "xhigh" - ], - "verbosity": "medium", - "verbosity_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, - "open_weights": false, - "knowledge": "2025-08-31", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 0.75, - "output": 4.5, + "input": 0.15, + "output": 1.2, "cache_read": 0.075 }, "type": "chat" }, { - "id": "gpt-4-turbo", - "name": "GPT-4 Turbo", - "display_name": "GPT-4 
Turbo", + "id": "rednote-hilab/dots.ocr", + "name": "dots.ocr", + "display_name": "dots.ocr", "modalities": { "input": [ "text", @@ -177774,79 +180633,88 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 131072, + "output": 131072 }, "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "attachment": true, - "open_weights": false, - "knowledge": "2023-12", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "open_weights": true, + "release_date": "2025-12-29", + "last_updated": "2026-04-25", "cost": { - "input": 10, - "output": 30 + "input": 0.01, + "output": 0.0109, + "cache_read": 0.005 }, "type": "chat" - }, + } + ] + }, + "minimax-cn-coding-plan": { + "id": "minimax-cn-coding-plan", + "name": "MiniMax Coding Plan (minimaxi.com)", + "display_name": "MiniMax Coding Plan (minimaxi.com)", + "api": "https://api.minimaxi.com/anthropic/v1", + "doc": "https://platform.minimaxi.com/docs/coding-plan/intro", + "models": [ { - "id": "gpt-5.1-chat-latest", - "name": "GPT-5.1 Chat", - "display_name": "GPT-5.1 Chat", + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-09-30", - "release_date": "2025-11-13", - "last_updated": "2025-11-13", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 1.25, - "output": 10, - "cache_read": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "o1", - "name": "o1", - "display_name": "o1", + "id": 
"MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ - "text", - "image", - "pdf" + "text" ], "output": [ "text" ] }, "limit": { - "context": 200000, - "output": 100000 + "context": 204800, + "output": 131072 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -177854,34 +180722,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" + "supported": true } }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-09", - "release_date": "2024-12-05", - "last_updated": "2024-12-05", + "attachment": false, + "open_weights": true, + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-4", - "name": "GPT-4", - "display_name": "GPT-4", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -177891,145 +180750,131 @@ ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2023-11", - "release_date": "2023-11-06", - "last_updated": "2024-04-09", + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 30, - "output": 60 + "input": 
0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, "type": "chat" }, { - "id": "gpt-image-1.5", - "name": "gpt-image-1.5", - "display_name": "gpt-image-1.5", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "temperature": false, - "tool_call": false, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": false, - "release_date": "2025-11-25", - "last_updated": "2025-11-25", - "type": "imageGeneration" - }, - { - "id": "gpt-4.1-nano", - "name": "GPT-4.1 nano", - "display_name": "GPT-4.1 nano", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1047576, - "output": 32768 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": false, - "knowledge": "2024-04", - "release_date": "2025-04-14", - "last_updated": "2025-04-14", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.1, - "output": 0.4, - "cache_read": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "gpt-image-2", - "name": "gpt-image-2", - "display_name": "gpt-image-2", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 204800, + "output": 131072 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - 
"open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "cost": { - "input": 5, - "output": 30, - "cache_read": 1.25 + "input": 0, + "output": 0, + "cache_read": 0, + "cache_write": 0 }, - "type": "imageGeneration" - } - ] - }, - "poolside": { - "id": "poolside", - "name": "Poolside", - "display_name": "Poolside", - "api": "https://inference.poolside.ai/v1", - "doc": "https://platform.poolside.ai", - "models": [ + "type": "chat" + }, { - "id": "poolside/laguna-m.1", - "name": "Laguna M.1", - "display_name": "Laguna M.1", + "id": "MiniMax-M3", + "name": "MiniMax-M3", + "display_name": "MiniMax-M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 131040, - "output": 8192 + "context": 512000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -178039,19 +180884,13 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": false, - "open_weights": false, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", + "attachment": true, + "open_weights": true, + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { "input": 0, "output": 0, @@ -178061,9 +180900,9 @@ "type": "chat" }, { - "id": "poolside/laguna-xs.2", - "name": "Laguna XS.2", - "display_name": "Laguna XS.2", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -178073,8 +180912,8 @@ ] }, "limit": { - "context": 131040, - "output": 8192 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178095,8 +180934,8 @@ }, "attachment": false, 
"open_weights": true, - "release_date": "2026-04-28", - "last_updated": "2026-04-28", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0, "output": 0, @@ -178107,17 +180946,17 @@ } ] }, - "sarvam": { - "id": "sarvam", - "name": "Sarvam AI", - "display_name": "Sarvam AI", - "api": "https://api.sarvam.ai/v1", - "doc": "https://docs.sarvam.ai/api-reference-docs/getting-started/models", + "deepseek": { + "id": "deepseek", + "name": "DeepSeek", + "display_name": "DeepSeek", + "api": "https://api.deepseek.com", + "doc": "https://api-docs.deepseek.com/zh-cn/quick_start/pricing", "models": [ { - "id": "sarvam-105b", - "name": "Sarvam-105B", - "display_name": "Sarvam-105B", + "id": "deepseek-v4-flash", + "name": "DeepSeek V4 Flash", + "display_name": "DeepSeek V4 Flash", "modalities": { "input": [ "text" @@ -178127,8 +180966,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -178139,24 +180978,40 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-18", - "last_updated": "2026-03-06", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 + }, "type": "chat" }, { - "id": "sarvam-30b", - "name": "Sarvam-30B", - "display_name": "Sarvam-30B", + "id": "deepseek-v4-pro", + "name": "DeepSeek V4 Pro", + "display_name": "DeepSeek V4 Pro", "modalities": { "input": [ "text" @@ -178166,8 +181021,8 @@ ] }, "limit": { - "context": 65536, - "output": 65536 + "context": 1048576, + "output": 393216 }, "temperature": true, "tool_call": true, @@ -178178,33 +181033,40 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Thinking mode is controlled through the thinking parameter; non-thinking mode disables reasoning." 
] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-18", - "last_updated": "2026-03-06", + "knowledge": "2025-05", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", + "cost": { + "input": 1.74, + "output": 3.48, + "cache_read": 0.145 + }, "type": "chat" - } - ] - }, - "baseten": { - "id": "baseten", - "name": "Baseten", - "display_name": "Baseten", - "api": "https://inference.baseten.co/v1", - "doc": "https://docs.baseten.co/inference/model-apis/overview", - "models": [ + }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "deepseek-reasoner", + "name": "DeepSeek Reasoner", + "display_name": "DeepSeek Reasoner", "modalities": { "input": [ "text" @@ -178214,10 +181076,10 @@ ] }, "limit": { - "context": 204000, - "output": 204000 + "context": 1048576, + "output": 393216 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -178226,29 +181088,40 @@ "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "high", + "max" + ], "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Compatibility alias for deepseek-v4-flash thinking mode." 
] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2025-09", + "release_date": "2025-01-20", + "last_updated": "2026-04-24", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 }, "type": "chat" }, { - "id": "zai-org/GLM-4.7", - "name": "GLM 4.7", - "display_name": "GLM 4.7", + "id": "deepseek-chat", + "name": "DeepSeek Chat", + "display_name": "DeepSeek Chat", "modalities": { "input": [ "text" @@ -178258,8 +181131,50 @@ ] }, "limit": { - "context": 200000, - "output": 200000 + "context": 1048576, + "output": 393216 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": true, + "knowledge": "2025-09", + "release_date": "2024-12-26", + "last_updated": "2026-04-24", + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.028 + }, + "type": "chat" + } + ] + }, + "minimax": { + "id": "minimax", + "name": "MiniMax (minimax.io)", + "display_name": "MiniMax (minimax.io)", + "api": "https://api.minimax.io/anthropic/v1", + "doc": "https://platform.minimax.io/docs/guides/quickstart", + "models": [ + { + "id": "MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178269,31 +181184,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "cost": { - "input": 0.12, - "output": 2.2, - 
"cache_read": 0.12 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM 5", - "display_name": "GLM 5", + "id": "MiniMax-M2.5-highspeed", + "name": "MiniMax-M2.5-highspeed", + "display_name": "MiniMax-M2.5-highspeed", "modalities": { "input": [ "text" @@ -178303,8 +181210,8 @@ ] }, "limit": { - "context": 202800, - "output": 202800 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178314,31 +181221,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2026-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2026-02-13", + "last_updated": "2026-02-13", "cost": { - "input": 0.95, - "output": 3.15, - "cache_read": 0.2 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "zai-org/GLM-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "MiniMax-M2.7-highspeed", + "name": "MiniMax-M2.7-highspeed", + "display_name": "MiniMax-M2.7-highspeed", "modalities": { "input": [ "text" @@ -178348,8 +181249,8 @@ ] }, "limit": { - "context": 202800, - "output": 202800 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178370,31 +181271,31 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.3, - "output": 4.3, - "cache_read": 0.26 + "input": 0.6, + "output": 2.4, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ 
- "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 196608, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -178404,43 +181305,34 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.95, - "output": 4, - "cache_read": 0.16 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262000, - "output": 262000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178450,42 +181342,38 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-30", + "release_date": "2026-02-12", "last_updated": "2026-02-12", "cost": { - "input": 0.6, - "output": 3, - "cache_read": 0.12 + "input": 0.3, + "output": 1.2, + "cache_read": 0.03, + "cache_write": 0.375 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.1", - "name": "DeepSeek V3.1", - "display_name": "DeepSeek V3.1", + "id": "MiniMax-M3", + "name": "MiniMax-M3", + "display_name": "MiniMax-M3", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ "text" ] }, 
"limit": { - "context": 164000, - "output": 131000 + "context": 512000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -178493,20 +181381,26 @@ "supported": true, "default": true }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": true, "open_weights": true, - "release_date": "2025-08-25", - "last_updated": "2025-08-25", + "release_date": "2026-06-01", + "last_updated": "2026-06-01", "cost": { - "input": 0.5, - "output": 1.5 + "input": 0.6, + "output": 2.4, + "cache_read": 0.12 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "Deepseek V4 Pro", - "display_name": "Deepseek V4 Pro", + "id": "MiniMax-M2.7", + "name": "MiniMax-M2.7", + "display_name": "MiniMax-M2.7", "modalities": { "input": [ "text" @@ -178516,8 +181410,8 @@ ] }, "limit": { - "context": 131000, - "output": 131000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -178538,120 +181432,195 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { - "input": 1.74, - "output": 3.48, - "cache_read": 0.145 + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 }, "type": "chat" - }, + } + ] + }, + "github-copilot": { + "id": "github-copilot", + "name": "GitHub Copilot", + "display_name": "GitHub Copilot", + "api": "https://api.githubcopilot.com", + "doc": "https://docs.github.com/en/copilot", + "models": [ { - "id": "nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B", - "name": "Nemotron Ultra", - "display_name": "Nemotron Ultra", + "id": "raptor-mini", + "name": "Raptor mini", + "display_name": "Raptor mini", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 400000, + "output": 128000 + }, + "temperature": false, + "tool_call": true, + "reasoning": 
{ + "supported": true, + "default": true + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", + "cost": { + "input": 0.25, + "output": 2, + "cache_read": 0.025 + }, + "type": "chat" + }, + { + "id": "claude-sonnet-4.5", + "name": "Claude Sonnet 4.5 (latest)", + "display_name": "Claude Sonnet 4.5 (latest)", + "modalities": { + "input": [ + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 202800 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "attachment": true, + "open_weights": false, + "knowledge": "2025-07-31", + "release_date": "2025-09-29", + "last_updated": "2025-09-29", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.12 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "nvidia/Nemotron-120B-A12B", - "name": "Nemotron Super", - "display_name": "Nemotron Super", + "id": "claude-sonnet-4", + "name": "Claude Sonnet 4 (latest)", + "display_name": "Claude Sonnet 4 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 202800 + "context": 216000, + "output": 16000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, "interleaved": true, "summaries": true, "visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-11", + "attachment": true, + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-05-22", + "last_updated": "2025-05-22", "cost": { - "input": 0.06, - "output": 0.75, - "cache_read": 0.06 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "OpenAI GPT 120B", - "display_name": "OpenAI GPT 120B", + "id": "gemini-2.5-pro", + "name": "Gemini 2.5 Pro", + "display_name": "Gemini 2.5 Pro", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128072, - "output": 128072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -178661,171 +181630,291 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] } }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "attachment": true, + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-03-20", + "last_updated": "2025-06-05", "cost": { - "input": 0.1, - "output": 0.5 + "input": 1.25, + "output": 10, + "cache_read": 0.125, + "tiers": [ + { + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 2.5, + "output": 15, + "cache_read": 0.25 + } }, "type": "chat" - } - ] - }, - "lucidquery": { - "id": "lucidquery", - "name": "LucidQuery AI", - "display_name": "LucidQuery AI", - "api": 
"https://lucidquery.com/api/v1", - "doc": "https://lucidquery.com/api/docs", - "models": [ + }, { - "id": "lucidquery-nexus-coder", - "name": "LucidQuery Nexus Coder", - "display_name": "LucidQuery Nexus Coder", + "id": "claude-haiku-4.5", + "name": "Claude Haiku 4.5 (latest)", + "display_name": "Claude Haiku 4.5 (latest)", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 250000, - "output": 60000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "budget", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude 4 manual thinking uses thinking.type = \"enabled\" with budget_tokens.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header for this model family." 
+ ] + } }, "attachment": true, "open_weights": false, - "knowledge": "2025-08-01", - "release_date": "2025-09-01", - "last_updated": "2025-09-01", + "knowledge": "2025-02-28", + "release_date": "2025-10-15", + "last_updated": "2025-10-15", "cost": { - "input": 2, - "output": 5 + "input": 1, + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, { - "id": "lucidnova-rf1-100b", - "name": "LucidNova RF1 100B", - "display_name": "LucidNova RF1 100B", + "id": "gemini-3.5-flash", + "name": "Gemini 3.5 Flash", + "display_name": "Gemini 3.5 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 120000, - "output": 8000 + "context": 200000, + "output": 64000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2025-09-16", - "release_date": "2024-12-28", - "last_updated": "2025-09-10", + "knowledge": "2025-01", + "release_date": "2026-05-19", + "last_updated": "2026-05-19", "cost": { - "input": 2, - "output": 5 + "input": 1.5, + "output": 9, + "cache_read": 0.15, + "input_audio": 1.5 }, "type": "chat" - } - ] - }, - "scaleway": { - "id": "scaleway", - "name": "Scaleway", - "display_name": "Scaleway", - "api": "https://api.scaleway.ai/v1", - "doc": "https://www.scaleway.com/en/docs/generative-apis/", - "models": [ + }, { - "id": "bge-multilingual-gemma2", - "name": "BGE Multilingual Gemma2", - "display_name": "BGE Multilingual Gemma2", + "id": "gpt-5.4-nano", + "name": "GPT-5.4 nano", + "display_name": "GPT-5.4 nano", "modalities": { 
"input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 8191, - "output": 3072 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, "open_weights": false, - "release_date": "2024-07-26", - "last_updated": "2025-06-15", + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 0.1, - "output": 0 + "input": 0.2, + "output": 1.25, + "cache_read": 0.02 }, "type": "chat" }, { - "id": "qwen3-coder-30b-a3b-instruct", - "name": "Qwen3-Coder 30B-A3B Instruct", - "display_name": "Qwen3-Coder 30B-A3B Instruct", + "id": "claude-opus-4.7", + "name": "Claude Opus 4.7", + "display_name": "Claude Opus 4.7", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 32000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-04", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ 
+ "Claude Opus 4.7 and newer Opus models require thinking.type = \"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-31", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { - "input": 0.2, - "output": 0.8 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "mistral-small-3.2-24b-instruct-2506", - "name": "Mistral Small 3.2 24B Instruct (2506)", - "display_name": "Mistral Small 3.2 24B Instruct (2506)", + "id": "gpt-5.2", + "name": "GPT-5.2", + "display_name": "GPT-5.2", "modalities": { "input": [ "text", @@ -178836,196 +181925,373 @@ ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-03", - "release_date": "2025-06-20", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.15, - "output": 0.35 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "pixtral-12b-2409", - "name": "Pixtral 12B 2409", - "display_name": "Pixtral 12B 2409", + "id": "gpt-5.3-codex", + "name": 
"GPT-5.3 Codex", + "display_name": "GPT-5.3 Codex", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-09", - "release_date": "2024-09-25", - "last_updated": "2026-03-17", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-05", + "last_updated": "2026-02-05", "cost": { - "input": 0.2, - "output": 0.2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, { - "id": "gpt-oss-120b", - "name": "GPT-OSS 120B", - "display_name": "GPT-OSS 120B", + "id": "claude-opus-4.8", + "name": "Claude Opus 4.8", + "display_name": "Claude Opus 4.8", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 32768 + "context": 200000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": false }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.7 and newer Opus models require thinking.type = 
\"adaptive\" to enable thinking explicitly.", + "Manual budget_tokens requests return 400 on Claude Opus 4.7 and newer adaptive-only Opus models.", + "task_budget is separate from thinking control and should not be treated as a thinking budget." + ] } }, "attachment": true, - "open_weights": true, - "release_date": "2024-01-01", - "last_updated": "2026-03-17", + "open_weights": false, + "release_date": "2026-05-28", + "last_updated": "2026-05-28", "cost": { - "input": 0.15, - "output": 0.6 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "gemma-3-27b-it", - "name": "Gemma-3-27B-IT", - "display_name": "Gemma-3-27B-IT", + "id": "claude-fable-5", + "name": "Claude Fable 5", + "display_name": "Claude Fable 5", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 40000, - "output": 8192 + "context": 1000000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "xhigh", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "omitted", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Adaptive thinking is always on for Claude Fable 5 and Claude Mythos 5; thinking.type = \"disabled\" is rejected.", + "Manual budget_tokens requests return 400 on Claude Fable 5 and Claude Mythos 5.", + "thinking.display defaults to omitted; set display to summarized to receive readable thinking summaries." 
+ ] + } + }, "attachment": true, "open_weights": false, - "knowledge": "2024-12", - "release_date": "2024-12-01", - "last_updated": "2026-03-17", + "knowledge": "2026-01-31", + "release_date": "2026-06-09", + "last_updated": "2026-06-09", "cost": { - "input": 0.25, - "output": 0.5 + "input": 10, + "output": 50, + "cache_read": 1, + "cache_write": 12.5 }, "type": "chat" }, { - "id": "voxtral-small-24b-2507", - "name": "Voxtral Small 24B 2507", - "display_name": "Voxtral Small 24B 2507", + "id": "claude-opus-4.5", + "name": "Claude Opus 4.5 (latest)", + "display_name": "Claude Opus 4.5 (latest)", "modalities": { "input": [ "text", - "audio" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ], + "notes": [ + "Claude Opus 4.5 uses manual thinking.type = \"enabled\" with budget_tokens; effort can be used alongside the thinking budget.", + "Interleaved thinking requires the interleaved-thinking-2025-05-14 beta header." 
+ ] + } }, "attachment": true, - "open_weights": true, - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "open_weights": false, + "knowledge": "2025-03-31", + "release_date": "2025-11-24", + "last_updated": "2025-11-24", "cost": { - "input": 0.15, - "output": 0.35 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "whisper-large-v3", - "name": "Whisper Large v3", - "display_name": "Whisper Large v3", + "id": "gpt-5.4", + "name": "GPT-5.4", + "display_name": "GPT-5.4", "modalities": { "input": [ - "audio" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 400000, + "output": 128000 }, "temperature": false, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false }, - "attachment": false, - "open_weights": true, - "knowledge": "2023-09", - "release_date": "2023-09-01", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-05", + "last_updated": "2026-03-05", "cost": { - "input": 0.003, - "output": 0 + "input": 2.5, + "output": 15, + "cache_read": 0.25, + "tiers": [ + { + "input": 5, + "output": 22.5, + "cache_read": 0.5, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 5, + "output": 22.5, + "cache_read": 0.5 + } }, "type": "chat" }, { - "id": "mistral-medium-3.5-128b", - "name": "Mistral Medium 3.5 128B", - "display_name": "Mistral Medium 3.5 128B", + "id": "gpt-5.4-mini", + "name": "GPT-5.4 mini", + "display_name": 
"GPT-5.4 mini", "modalities": { "input": [ "text", @@ -179036,72 +182302,103 @@ ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "effort", + "effort": "none", + "effort_options": [ + "none", + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } }, "attachment": true, - "open_weights": true, - "release_date": "2026-04-29", - "last_updated": "2026-04-29", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-03-17", + "last_updated": "2026-03-17", "cost": { - "input": 1.5, - "output": 7.5 + "input": 0.75, + "output": 4.5, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "qwen3-embedding-8b", - "name": "Qwen3 Embedding 8B", - "display_name": "Qwen3 Embedding 8B", + "id": "gpt-4.1", + "name": "GPT-4.1", + "display_name": "GPT-4.1", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 32768, - "output": 4096 + "context": 128000, + "output": 16384 }, - "temperature": false, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2025-25-11", - "last_updated": "2026-03-17", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { - "input": 0.1, - "output": 0 + "input": 2, + "output": 8, + "cache_read": 0.5 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemma-4-26b-a4b-it", - "name": "Gemma 4 26B A4B IT", - "display_name": "Gemma 4 26B A4B IT", + "id": "gemini-3.1-pro-preview", + "name": "Gemini 3.1 Pro 
Preview", + "display_name": "Gemini 3.1 Pro Preview", "modalities": { "input": [ "text", - "image" + "image", + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -179109,113 +182406,191 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-04-01", - "last_updated": "2026-05-22", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2026-02-19", + "last_updated": "2026-02-19", "cost": { - "input": 0.25, - "output": 0.5 + "input": 2, + "output": 12, + "cache_read": 0.2, + "tiers": [ + { + "input": 4, + "output": 18, + "cache_read": 0.4, + "tier": { + "type": "context", + "size": 200000 + } + } + ], + "context_over_200k": { + "input": 4, + "output": 18, + "cache_read": 0.4 + } }, "type": "chat" }, { - "id": "qwen3.6-35b-a3b", - "name": "Qwen3.6 35B A3B", - "display_name": "Qwen3.6 35B A3B", + "id": "claude-sonnet-4.6", + "name": "Claude Sonnet 4.6", + "display_name": "Claude Sonnet 4.6", "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": true, - "default": true + "default": false }, "extra_capabilities": { "reasoning": { "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], "interleaved": true, "summaries": true, 
"visibility": "summary", "continuation": [ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-05-01", - "last_updated": "2026-05-22", + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 0.25, - "output": 1.5 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, { - "id": "qwen3-235b-a22b-instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "gpt-5-mini", + "name": "GPT-5 Mini", + "display_name": "GPT-5 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 260000, - "output": 16384 + "context": 264000, + "output": 64000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-01", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "minimal", + "low", + "medium", + "high" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2024-05-30", + "release_date": "2025-08-07", + "last_updated": "2025-08-07", "cost": { - "input": 0.75, - "output": 2.25, - "reasoning": 8.4 + "input": 0.25, + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, { - "id": "qwen3.5-397b-a17b", - "name": "Qwen3.5 397B 
A17B", - "display_name": "Qwen3.5 397B A17B", + "id": "gemini-3-flash-preview", + "name": "Gemini 3 Flash Preview", + "display_name": "Gemini 3 Flash Preview", "modalities": { "input": [ "text", "image", - "video" + "video", + "audio", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -179226,145 +182601,255 @@ "extra_capabilities": { "reasoning": { "supported": true, - "interleaved": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "minimal", + "low", + "medium", + "high" + ], "summaries": true, "visibility": "summary", "continuation": [ - "thinking_blocks" + "thought_signatures" ] } }, "attachment": true, - "open_weights": true, - "knowledge": "2025-04", - "release_date": "2026-03-17", - "last_updated": "2026-03-17", + "open_weights": false, + "knowledge": "2025-01", + "release_date": "2025-12-17", + "last_updated": "2025-12-17", "cost": { - "input": 0.6, - "output": 3.6 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "input_audio": 1 }, "type": "chat" }, { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "claude-opus-4.6", + "name": "Claude Opus 4.6", + "display_name": "Claude Opus 4.6", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 100000, - "output": 16384 + "context": 200000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": false + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": false, + "mode": "mixed", + "budget": { + "min": 1024, + "unit": "tokens" + }, + "effort": "high", + "effort_options": [ + "low", + "medium", + "high", + "max" + ], + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ 
+ "thinking_blocks" + ], + "notes": [ + "Anthropic recommends adaptive thinking with effort for Claude 4.6; budget_tokens remains a deprecated compatibility path.", + "Anthropic API defaults effort to high; lower effort levels should be chosen per workload." + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2026-03-17", + "open_weights": false, + "knowledge": "2025-05-31", + "release_date": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 0.9, - "output": 0.9 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, { - "id": "devstral-2-123b-instruct-2512", - "name": "Devstral 2 123B Instruct (2512)", - "display_name": "Devstral 2 123B Instruct (2512)", + "id": "gpt-5.2-codex", + "name": "GPT-5.2 Codex", + "display_name": "GPT-5.2 Codex", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-07", - "last_updated": "2026-03-17", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { - "input": 0.4, - "output": 2 + "input": 1.75, + "output": 14, + "cache_read": 0.175 }, "type": "chat" - } - ] - }, - "cerebras": { - "id": "cerebras", - "name": "Cerebras", - 
"display_name": "Cerebras", - "doc": "https://inference-docs.cerebras.ai/models/overview", - "models": [ + }, { - "id": "zai-glm-4.7", - "name": "Z.AI GLM-4.7", - "display_name": "Z.AI GLM-4.7", + "id": "gpt-5.5", + "name": "GPT-5.5", + "display_name": "GPT-5.5", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 40000 + "context": 400000, + "output": 128000 }, - "temperature": true, + "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-10", - "last_updated": "2026-01-10", + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high", + "xhigh" + ], + "verbosity": "medium", + "verbosity_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "attachment": true, + "open_weights": false, + "knowledge": "2025-12-01", + "release_date": "2026-04-23", + "last_updated": "2026-04-23", "cost": { - "input": 2.25, - "output": 2.75, - "cache_read": 0, - "cache_write": 0 + "input": 5, + "output": 30, + "cache_read": 0.5, + "tiers": [ + { + "input": 10, + "output": 45, + "cache_read": 1, + "tier": { + "type": "context", + "size": 272000 + } + } + ], + "context_over_200k": { + "input": 10, + "output": 45, + "cache_read": 1 + } }, "type": "chat" - }, + } + ] + }, + "clarifai": { + "id": "clarifai", + "name": "Clarifai", + "display_name": "Clarifai", + "api": "https://api.clarifai.com/v2/ext/openai/v1", + "doc": "https://docs.clarifai.com/compute/inference/", + "models": [ { - "id": "gpt-oss-120b", - "name": "GPT OSS 120B", - "display_name": "GPT OSS 120B", + "id": "moonshotai/chat-completion/models/Kimi-K2_6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + 
"image" ], "output": [ "text" ] }, "limit": { - "context": 131072, - "output": 32768 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -179374,23 +182859,30 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-08-05", - "last_updated": "2025-08-05", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 0.25, - "output": 0.69 + "input": 0.95, + "output": 4 }, "type": "chat" }, { - "id": "llama3.1-8b", - "name": "Llama 3.1 8B", - "display_name": "Llama 3.1 8B", + "id": "minimaxai/chat-completion/models/MiniMax-M2_5-high-throughput", + "name": "MiniMax-M2.5 High Throughput", + "display_name": "MiniMax-M2.5 High Throughput", "modalities": { "input": [ "text" @@ -179400,38 +182892,29 @@ ] }, "limit": { - "context": 32000, - "output": 8000 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2025-01-01", - "last_updated": "2026-05-27", + "release_date": "2026-02-12", + "last_updated": "2026-02-25", "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.3, + "output": 1.2 }, "type": "chat" - } - ] - }, - "hpc-ai": { - "id": "hpc-ai", - "name": "HPC-AI", - "display_name": "HPC-AI", - "api": "https://api.hpc-ai.com/inference/v1", - "doc": "https://www.hpc-ai.com/doc/docs/quickstart/", - "models": [ + }, { - "id": "zai-org/glm-5.1", - "name": "GLM 5.1", - "display_name": "GLM 5.1", + "id": "openai/chat-completion/models/gpt-oss-120b-high-throughput", + "name": "GPT OSS 120B High Throughput", + "display_name": "GPT OSS 120B High Throughput", 
"modalities": { "input": [ "text" @@ -179441,8 +182924,8 @@ ] }, "limit": { - "context": 202000, - "output": 202000 + "context": 131072, + "output": 16384 }, "temperature": true, "tool_call": true, @@ -179450,47 +182933,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "release_date": "2026-04-08", - "last_updated": "2026-06-01", + "release_date": "2025-08-05", + "last_updated": "2026-02-25", "cost": { - "input": 0.615, - "output": 2.46, - "cache_read": 0.133 + "input": 0.09, + "output": 0.36 }, "type": "chat" }, { - "id": "moonshotai/kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "openai/chat-completion/models/gpt-oss-20b", + "name": "GPT OSS 20B", + "display_name": "GPT OSS 20B", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 131072, + "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -179498,42 +182967,35 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01-01", - "release_date": "2026-01-01", - "last_updated": "2026-06-01", + "release_date": "2025-08-05", + "last_updated": "2025-12-12", "cost": { - "input": 0.3, - "output": 1.5, - "cache_read": 0.05 + "input": 0.045, + "output": 0.18 }, "type": "chat" }, { - "id": "minimax/minimax-m2.5", - "name": "MiniMax M2.5", - "display_name": "MiniMax M2.5", + "id": "mistralai/completion/models/Ministral-3-14B-Reasoning-2512", + "name": "Ministral 3 14B Reasoning 2512", + 
"display_name": "Ministral 3 14B Reasoning 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 131072 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -179541,46 +183003,33 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-06-01", + "knowledge": "2025-12", + "release_date": "2025-12-01", + "last_updated": "2025-12-12", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 + "input": 2.5, + "output": 1.7 }, "type": "chat" - } - ] - }, - "alibaba-token-plan": { - "id": "alibaba-token-plan", - "name": "Alibaba Token Plan", - "display_name": "Alibaba Token Plan", - "api": "https://token-plan.ap-southeast-1.maas.aliyuncs.com/compatible-mode/v1", - "doc": "https://www.alibabacloud.com/help/en/model-studio/token-plan-overview", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "mistralai/completion/models/Ministral-3-3B-Reasoning-2512", + "name": "Ministral 3 3B Reasoning 2512", + "display_name": "Ministral 3 3B Reasoning 2512", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -179588,39 +183037,27 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 
0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.039, + "output": 0.54825 }, "type": "chat" }, { - "id": "qwen-image-2.0-pro", - "name": "Qwen Image 2.0 Pro", - "display_name": "Qwen Image 2.0 Pro", + "id": "deepseek-ai/deepseek-ocr/models/DeepSeek-OCR", + "name": "DeepSeek OCR", + "display_name": "DeepSeek OCR", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ - "image" + "text" ] }, "limit": { @@ -179632,20 +183069,20 @@ "reasoning": { "supported": false }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "attachment": true, + "open_weights": true, + "release_date": "2025-10-20", + "last_updated": "2026-02-25", "cost": { - "input": 0, - "output": 0 + "input": 0.2, + "output": 0.7 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "DeepSeek V3.2", - "display_name": "DeepSeek V3.2", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Thinking-2507", + "name": "Qwen3 30B A3B Thinking 2507", + "display_name": "Qwen3 30B A3B Thinking 2507", "modalities": { "input": [ "text" @@ -179655,8 +183092,8 @@ ] }, "limit": { - "context": 131072, - "output": 65536 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -179666,60 +183103,63 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-12-03", - "last_updated": "2025-12-05", + "release_date": "2025-07-31", + "last_updated": "2026-02-25", "cost": { - "input": 0, - "output": 0 + "input": 0.36, + "output": 1.3 }, "type": "chat" }, { - "id": "wan2.7-image", - "name": "Wan2.7 Image", - "display_name": "Wan2.7 Image", + "id": "qwen/qwenLM/models/Qwen3-30B-A3B-Instruct-2507", + "name": "Qwen3 30B A3B Instruct 2507", + 
"display_name": "Qwen3 30B A3B Instruct 2507", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-29", - "last_updated": "2026-05-29", + "open_weights": true, + "release_date": "2025-07-30", + "last_updated": "2026-02-25", "cost": { - "input": 0, - "output": 0 + "input": 0.3, + "output": 0.5 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "kimi-k2.6", - "name": "Kimi K2.6", - "display_name": "Kimi K2.6", + "id": "qwen/qwenCoder/models/Qwen3-Coder-30B-A3B-Instruct", + "name": "Qwen3 Coder 30B A3B Instruct", + "display_name": "Qwen3 Coder 30B A3B Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" @@ -179727,42 +183167,28 @@ }, "limit": { "context": 262144, - "output": 16384 + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "knowledge": "2025-04", + "release_date": "2025-07-31", + "last_updated": "2026-02-12", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.11458, + "output": 0.74812 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "arcee_ai/AFM/models/trinity-mini", + "name": "Trinity Mini", + "display_name": "Trinity Mini", "modalities": { "input": [ "text" @@ -179772,8 +183198,8 @@ ] }, 
"limit": { - "context": 1000000, - "output": 65536 + "context": 131072, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -179781,71 +183207,74 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "open_weights": true, + "knowledge": "2024-10", + "release_date": "2025-12", + "last_updated": "2026-02-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.045, + "output": 0.15 }, "type": "chat" }, { - "id": "wan2.7-image-pro", - "name": "Wan2.7 Image Pro", - "display_name": "Wan2.7 Image Pro", + "id": "clarifai/main/models/mm-poly-8b", + "name": "MM Poly 8B", + "display_name": "MM Poly 8B", "modalities": { "input": [ - "text" + "text", + "image", + "video" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 32768, + "output": 4096 }, "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": false, - "release_date": "2026-05-29", - "last_updated": "2026-05-29", + "release_date": "2025-06", + "last_updated": "2026-02-25", "cost": { - "input": 0, - "output": 0 + "input": 0.658, + "output": 1.11 }, - "type": "imageGeneration" - }, + "type": "chat" + } + ] + }, + "the-grid-ai": { + "id": "the-grid-ai", + "name": "The Grid AI", + "display_name": "The Grid AI", + "api": "https://api.thegrid.ai/v1", + "doc": "https://thegrid.ai/docs", + "models": [ { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "agent-prime", + "name": "Agent Prime", + "display_name": "Agent Prime", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 64000 }, "temperature": true, 
"tool_call": true, @@ -179853,39 +183282,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "agent-max", + "name": "Agent Max", + "display_name": "Agent Max", "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" @@ -179893,7 +183303,7 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -179912,53 +183322,44 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-04-27", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "qwen-image-2.0", - "name": "Qwen Image 2.0", - "display_name": "Qwen Image 2.0", + "id": "text-standard", + "name": "Text Standard", + "display_name": "Text Standard", "modalities": { "input": [ "text" ], "output": [ - "image" + "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 16000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", - "cost": { - "input": 0, - "output": 0 - }, - "type": "imageGeneration" + "release_date": "2026-02-26", + 
"last_updated": "2026-05-19", + "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "DeepSeek V4 Flash", - "display_name": "DeepSeek V4 Flash", + "id": "code-prime", + "name": "Code Prime", + "display_name": "Code Prime", "modalities": { "input": [ "text" @@ -179968,8 +183369,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -179977,33 +183378,16 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, + "open_weights": false, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "text-prime", + "name": "Text Prime", + "display_name": "Text Prime", "modalities": { "input": [ "text" @@ -180013,8 +183397,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 128000, + "output": 30000 }, "temperature": true, "tool_call": true, @@ -180022,36 +183406,20 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "release_date": "2026-02-26", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "code-max", + "name": "Code Max", + 
"display_name": "Code Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -180059,7 +183427,7 @@ }, "limit": { "context": 1000000, - "output": 384000 + "output": 128000 }, "temperature": true, "tool_call": true, @@ -180079,34 +183447,26 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0 - }, + "open_weights": false, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "agent-standard", + "name": "Agent Standard", + "display_name": "Agent Standard", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -180114,44 +183474,27 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01", - "last_updated": "2026-01", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "attachment": false, + "open_weights": false, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" }, { - "id": "glm-5.1", - "name": "GLM-5.1", - "display_name": "GLM-5.1", + "id": "text-max", + "name": "Text Max", + "display_name": "Text Max", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, + "context": 1000000, "output": 128000 }, "temperature": true, @@ -180172,30 +183515,15 @@ } }, "attachment": false, - "open_weights": true, - "release_date": 
"2026-03-27", - "last_updated": "2026-03-27", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "open_weights": false, + "release_date": "2026-03-24", + "last_updated": "2026-05-19", "type": "chat" - } - ] - }, - "tencent-tokenhub": { - "id": "tencent-tokenhub", - "name": "Tencent TokenHub", - "display_name": "Tencent TokenHub", - "api": "https://tokenhub.tencentmaas.com/v1", - "doc": "https://cloud.tencent.com/document/product/1823/130050", - "models": [ + }, { - "id": "hy3-preview", - "name": "Hy3 preview", - "display_name": "Hy3 preview", + "id": "code-standard", + "name": "Code Standard", + "display_name": "Code Standard", "modalities": { "input": [ "text" @@ -180205,8 +183533,8 @@ ] }, "limit": { - "context": 256000, - "output": 64000 + "context": 128000, + "output": 16000 }, "temperature": true, "tool_call": true, @@ -180214,81 +183542,58 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", - "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 - }, + "open_weights": false, + "release_date": "2026-05-04", + "last_updated": "2026-05-19", "type": "chat" } ] }, - "alibaba-coding-plan-cn": { - "id": "alibaba-coding-plan-cn", - "name": "Alibaba Coding Plan (China)", - "display_name": "Alibaba Coding Plan (China)", - "api": "https://coding.dashscope.aliyuncs.com/v1", - "doc": "https://help.aliyun.com/zh/model-studio/coding-plan", + "synthetic": { + "id": "synthetic", + "name": "Synthetic", + "display_name": "Synthetic", + "api": "https://api.synthetic.new/openai/v1", + "doc": "https://synthetic.new/pricing", "models": [ { - "id": "MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8", + "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "display_name": 
"Llama-4-Maverick-17B-128E-Instruct-FP8", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 196608, - "output": 24576 + "context": 524000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.22, + "output": 0.88 }, "type": "chat" }, { - "id": "qwen3.5-plus", - "name": "Qwen3.5 Plus", - "display_name": "Qwen3.5 Plus", + "id": "hf:meta-llama/Llama-4-Scout-17B-16E-Instruct", + "name": "Llama-4-Scout-17B-16E-Instruct", + "display_name": "Llama-4-Scout-17B-16E-Instruct", "modalities": { "input": [ "text", @@ -180299,43 +183604,29 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 328000, + "output": 4096 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "attachment": true, + "open_weights": true, + "knowledge": "2024-08", + "release_date": "2025-04-05", + "last_updated": "2025-04-05", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.15, + "output": 0.6 }, "type": "chat" }, { - "id": 
"qwen3-coder-plus", - "name": "Qwen3 Coder Plus", - "display_name": "Qwen3 Coder Plus", + "id": "hf:meta-llama/Llama-3.3-70B-Instruct", + "name": "Llama-3.3-70B-Instruct", + "display_name": "Llama-3.3-70B-Instruct", "modalities": { "input": [ "text" @@ -180345,31 +183636,30 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-07-23", - "last_updated": "2025-07-23", + "knowledge": "2023-12", + "release_date": "2024-12-06", + "last_updated": "2024-12-06", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "glm-4.7", - "name": "GLM-4.7", - "display_name": "GLM-4.7", + "id": "hf:meta-llama/Llama-3.1-70B-Instruct", + "name": "Llama-3.1-70B-Instruct", + "display_name": "Llama-3.1-70B-Instruct", "modalities": { "input": [ "text" @@ -180379,8 +183669,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -180388,34 +183678,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-04", - "release_date": "2025-12-22", - "last_updated": "2025-12-22", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "qwen3-coder-next", - "name": "Qwen3 Coder Next", - "display_name": "Qwen3 Coder Next", + "id": "hf:meta-llama/Llama-3.1-405B-Instruct", + 
"name": "Llama-3.1-405B-Instruct", + "display_name": "Llama-3.1-405B-Instruct", "modalities": { "input": [ "text" @@ -180425,30 +183702,30 @@ ] }, "limit": { - "context": 262144, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "release_date": "2026-02-03", - "last_updated": "2026-02-03", + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 3, + "output": 3 }, "type": "chat" }, { - "id": "qwen3.7-max", - "name": "Qwen3.7 Max", - "display_name": "Qwen3.7 Max", + "id": "hf:meta-llama/Llama-3.1-8B-Instruct", + "name": "Llama-3.1-8B-Instruct", + "display_name": "Llama-3.1-8B-Instruct", "modalities": { "input": [ "text" @@ -180458,8 +183735,8 @@ ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -180467,40 +183744,32 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, - "open_weights": false, - "release_date": "2026-05-21", - "last_updated": "2026-05-21", + "open_weights": true, + "knowledge": "2023-12", + "release_date": "2024-07-23", + "last_updated": "2024-07-23", "cost": { - "input": 2.5, - "output": 7.5, - "cache_read": 0.5, - "cache_write": 3.125 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "qwen3.6-plus", - "name": "Qwen3.6 Plus", - "display_name": "Qwen3.6 Plus", + "id": "hf:deepseek-ai/DeepSeek-R1", + "name": "DeepSeek R1", + "display_name": "DeepSeek R1", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, 
@@ -180520,68 +183789,51 @@ } }, "attachment": false, - "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-04-02", - "last_updated": "2026-04-02", + "open_weights": true, + "knowledge": "2025-01", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "qwen3.6-flash", - "name": "Qwen3.6 Flash", - "display_name": "Qwen3.6 Flash", + "id": "hf:deepseek-ai/DeepSeek-V3-0324", + "name": "DeepSeek V3 (0324)", + "display_name": "DeepSeek V3 (0324)", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 65536 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2026-04-27", - "last_updated": "2026-04-27", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0.1875, - "output": 1.125, - "cache_write": 0.234375 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "qwen3-max-2026-01-23", - "name": "Qwen3 Max", - "display_name": "Qwen3 Max", + "id": "hf:deepseek-ai/DeepSeek-V3.1-Terminus", + "name": "DeepSeek V3.1 Terminus", + "display_name": "DeepSeek V3.1 Terminus", "modalities": { "input": [ "text" @@ -180591,42 +183843,29 @@ ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": 
true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": true, + "default": true }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-01-23", - "last_updated": "2026-01-23", + "release_date": "2025-09-22", + "last_updated": "2025-09-25", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "glm-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "hf:deepseek-ai/DeepSeek-R1-0528", + "name": "DeepSeek R1 (0528)", + "display_name": "DeepSeek R1 (0528)", "modalities": { "input": [ "text" @@ -180636,8 +183875,8 @@ ] }, "limit": { - "context": 202752, - "output": 16384 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -180658,32 +183897,29 @@ }, "attachment": false, "open_weights": false, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2025-08-01", + "last_updated": "2025-08-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 3, + "output": 8 }, "type": "chat" }, { - "id": "qwen3.7-plus", - "name": "Qwen3.7 Plus", - "display_name": "Qwen3.7 Plus", + "id": "hf:deepseek-ai/DeepSeek-V3.1", + "name": "DeepSeek V3.1", + "display_name": "DeepSeek V3.1", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 1000000, - "output": 64000 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -180691,40 +183927,31 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": false, - "knowledge": "2025-04", - "release_date": "2026-06-02", - "last_updated": "2026-06-02", + "release_date": "2025-08-21", + "last_updated": "2025-08-21", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, - "cache_write": 0 + "input": 0.56, + 
"output": 1.68 }, "type": "chat" }, { - "id": "kimi-k2.5", - "name": "Kimi K2.5", - "display_name": "Kimi K2.5", + "id": "hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "display_name": "DeepSeek V3.2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 32768 + "context": 162816, + "output": 8000 }, "temperature": true, "tool_call": true, @@ -180734,41 +183961,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2025-12-01", + "last_updated": "2025-12-01", "cost": { - "input": 0, - "output": 0, - "cache_read": 0, + "input": 0.27, + "output": 0.4, + "cache_read": 0.27, "cache_write": 0 }, "type": "chat" - } - ] - }, - "nebius": { - "id": "nebius", - "name": "Nebius Token Factory", - "display_name": "Nebius Token Factory", - "api": "https://api.tokenfactory.nebius.com/v1", - "doc": "https://docs.tokenfactory.nebius.com/", - "models": [ + }, { - "id": "MiniMaxAI/MiniMax-M2.5", - "name": "MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "hf:deepseek-ai/DeepSeek-V3", + "name": "DeepSeek V3", + "display_name": "DeepSeek V3", "modalities": { "input": [ "text" @@ -180778,8 +183989,8 @@ ] }, "limit": { - "context": 196608, - "output": 8192 + "context": 128000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -180787,28 +183998,21 @@ "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", + "knowledge": "2024-07", "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "last_updated": "2025-05-29", "cost": { - 
"input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 1.25, + "output": 1.25 }, "type": "chat" }, { - "id": "MiniMaxAI/MiniMax-M2.5-fast", - "name": "MiniMax-M2.5-fast", - "display_name": "MiniMax-M2.5-fast", + "id": "hf:moonshotai/Kimi-K2-Thinking", + "name": "Kimi K2 Thinking", + "display_name": "Kimi K2 Thinking", "modalities": { "input": [ "text" @@ -180818,8 +184022,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -180827,23 +184031,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + "knowledge": "2025-11", + "release_date": "2025-11-07", + "last_updated": "2025-11-07", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "zai-org/GLM-5", - "name": "GLM-5", - "display_name": "GLM-5", + "id": "hf:moonshotai/Kimi-K2-Instruct-0905", + "name": "Kimi K2 0905", + "display_name": "Kimi K2 0905", "modalities": { "input": [ "text" @@ -180853,54 +184066,41 @@ ] }, "limit": { - "context": 200000, - "output": 16384 + "context": 262144, + "output": 32768 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2026-01", - "release_date": "2026-03-01", - "last_updated": "2026-03-10", + "open_weights": true, + "knowledge": "2024-10", + 
"release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 1, - "output": 3.2, - "cache_read": 0.1, - "cache_write": 1 + "input": 1.2, + "output": 1.2 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-405B", - "name": "Hermes-4-405B", - "display_name": "Hermes-4-405B", + "id": "hf:moonshotai/Kimi-K2.6", + "name": "Kimi K2.6", + "display_name": "Kimi K2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -180919,35 +184119,34 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "knowledge": "2025-01", + "release_date": "2026-04-21", + "last_updated": "2026-04-21", "cost": { - "input": 1, - "output": 3, - "reasoning": 3, - "cache_read": 0.1, - "cache_write": 1.25 + "input": 0.95, + "output": 4, + "cache_read": 0.95 }, "type": "chat" }, { - "id": "NousResearch/Hermes-4-70B", - "name": "Hermes-4-70B", - "display_name": "Hermes-4-70B", + "id": "hf:moonshotai/Kimi-K2.5", + "name": "Kimi K2.5", + "display_name": "Kimi K2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -180968,34 +184167,30 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-30", - "last_updated": "2026-02-04", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.13, - "output": 0.4, - "reasoning": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5", - "name": "Kimi-K2.5", - "display_name": "Kimi-K2.5", + "id": "hf:zai-org/GLM-4.7-Flash", + 
"name": "GLM-4.7-Flash", + "display_name": "GLM-4.7-Flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -181014,36 +184209,32 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", + "release_date": "2026-01-18", + "last_updated": "2026-01-18", "cost": { - "input": 0.5, - "output": 2.5, - "reasoning": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.06, + "output": 0.4, + "cache_read": 0.06 }, "type": "chat" }, { - "id": "moonshotai/Kimi-K2.5-fast", - "name": "Kimi-K2.5-fast", - "display_name": "Kimi-K2.5-fast", + "id": "hf:zai-org/GLM-4.6", + "name": "GLM 4.6", + "display_name": "GLM 4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -181053,32 +184244,24 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-12-15", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-09-30", + "last_updated": "2025-09-30", "cost": { - "input": 0.5, - "output": 2.5, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "meta-llama/Meta-Llama-3.1-8B-Instruct", - "name": "Meta-Llama-3.1-8B-Instruct", - "display_name": "Meta-Llama-3.1-8B-Instruct", + "id": "hf:zai-org/GLM-5", + "name": "GLM-5", + "display_name": "GLM-5", "modalities": { "input": [ "text" @@ -181088,31 
+184271,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2024-07-23", - "last_updated": "2026-02-04", + "release_date": "2026-02-12", + "last_updated": "2026-04-08", "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "meta-llama/Llama-3.3-70B-Instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "hf:zai-org/GLM-4.7", + "name": "GLM 4.7", + "display_name": "GLM 4.7", "modalities": { "input": [ "text" @@ -181122,31 +184315,41 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2025-08", - "release_date": "2025-12-05", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-12-22", + "last_updated": "2025-12-22", "cost": { - "input": 0.13, - "output": 0.4, - "cache_read": 0.013, - "cache_write": 0.16 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V4-Pro", - "name": "DeepSeek V4 Pro", - "display_name": "DeepSeek V4 Pro", + "id": "hf:zai-org/GLM-5.1", + "name": "GLM 5.1", + "display_name": "GLM 5.1", 
"modalities": { "input": [ "text" @@ -181156,8 +184359,8 @@ ] }, "limit": { - "context": 1000000, - "output": 384000 + "context": 196608, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -181178,20 +184381,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-05", - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-03-27", + "last_updated": "2026-04-12", "cost": { - "input": 1.75, - "output": 3.5, - "cache_read": 0.15 + "input": 1, + "output": 3, + "cache_read": 1 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2", - "name": "DeepSeek-V3.2", - "display_name": "DeepSeek-V3.2", + "id": "hf:MiniMaxAI/MiniMax-M2.1", + "name": "MiniMax-M2.1", + "display_name": "MiniMax-M2.1", "modalities": { "input": [ "text" @@ -181201,8 +184403,8 @@ ] }, "limit": { - "context": 163000, - "output": 16384 + "context": 204800, + "output": 131072 }, "temperature": true, "tool_call": true, @@ -181222,23 +184424,19 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-11", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", - "cost": { - "input": 0.3, - "output": 0.45, - "reasoning": 0.45, - "cache_read": 0.03, - "cache_write": 0.375 + "open_weights": true, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", + "cost": { + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V3.2-fast", - "name": "DeepSeek-V3.2-fast", - "display_name": "DeepSeek-V3.2-fast", + "id": "hf:MiniMaxAI/MiniMax-M2", + "name": "MiniMax-M2", + "display_name": "MiniMax-M2", "modalities": { "input": [ "text" @@ -181248,8 +184446,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 196608, + "output": 131000 }, "temperature": true, "tool_call": true, @@ -181257,23 +184455,25 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", 
- "release_date": "2025-01-27", - "last_updated": "2026-05-07", + "release_date": "2025-10-27", + "last_updated": "2025-10-27", "cost": { - "input": 0.4, - "output": 2, - "cache_read": 0.04, - "cache_write": 0.5 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1", - "name": "Llama-3.1-Nemotron-Ultra-253B-v1", - "display_name": "Llama-3.1-Nemotron-Ultra-253B-v1", + "id": "hf:MiniMaxAI/MiniMax-M2.5", + "name": "MiniMax-M2.5", + "display_name": "MiniMax-M2.5", "modalities": { "input": [ "text" @@ -181283,31 +184483,41 @@ ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 191488, + "output": 65536 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-15", - "last_updated": "2026-02-04", + "release_date": "2026-02-07", + "last_updated": "2026-02-07", "cost": { "input": 0.6, - "output": 1.8, - "cache_read": 0.06, - "cache_write": 0.75 + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "nvidia/Nemotron-3-Nano-Omni", - "name": "Nemotron-3-Nano-Omni", - "display_name": "Nemotron-3-Nano-Omni", + "id": "hf:openai/gpt-oss-120b", + "name": "GPT OSS 120B", + "display_name": "GPT OSS 120B", "modalities": { "input": [ "text" @@ -181317,8 +184527,8 @@ ] }, "limit": { - "context": 65536, - "output": 8192 + "context": 128000, + "output": 32768 }, "temperature": true, "tool_call": true, @@ -181326,34 +184536,37 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-01-20", - "last_updated": "2026-05-07", + 
"release_date": "2025-08-05", + "last_updated": "2025-08-05", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "nvidia/nemotron-3-super-120b-a12b", - "name": "Nemotron-3-Super-120B-A12B", - "display_name": "Nemotron-3-Super-120B-A12B", + "id": "hf:Qwen/Qwen3.5-397B-A17B", + "name": "Qwen3.5-97B-A17B", + "display_name": "Qwen3.5-97B-A17B", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -181361,21 +184574,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2026-02", - "release_date": "2026-03-11", - "last_updated": "2026-03-12", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.6, + "output": 3, + "cache_read": 0.6 }, "type": "chat" }, { - "id": "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B", - "name": "Nemotron-3-Nano-30B-A3B", - "display_name": "Nemotron-3-Nano-30B-A3B", + "id": "hf:Qwen/Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3 235B A22B Thinking 2507", + "display_name": "Qwen3 235B A22B Thinking 2507", "modalities": { "input": [ "text" @@ -181385,31 +184609,41 @@ ] }, "limit": { - "context": 32000, - "output": 4096 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": false, 
"open_weights": true, - "knowledge": "2025-05", - "release_date": "2025-08-10", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-25", + "last_updated": "2025-07-25", "cost": { - "input": 0.06, - "output": 0.24, - "cache_read": 0.006, - "cache_write": 0.075 + "input": 0.65, + "output": 3 }, "type": "chat" }, { - "id": "PrimeIntellect/INTELLECT-3", - "name": "INTELLECT-3", - "display_name": "INTELLECT-3", + "id": "hf:Qwen/Qwen3-Coder-480B-A35B-Instruct", + "name": "Qwen 3 Coder 480B", + "display_name": "Qwen 3 Coder 480B", "modalities": { "input": [ "text" @@ -181419,8 +184653,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -181429,21 +184663,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-25", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { - "input": 0.2, - "output": 1.1, - "cache_read": 0.02, - "cache_write": 0.25 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Embedding-8B", - "name": "Qwen3-Embedding-8B", - "display_name": "Qwen3-Embedding-8B", + "id": "hf:Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen2.5-Coder-32B-Instruct", "modalities": { "input": [ "text" @@ -181454,28 +184686,28 @@ }, "limit": { "context": 32768, - "output": 8192 + "output": 32768 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", + "knowledge": "2024-10", + "release_date": "2024-11-11", + "last_updated": "2024-11-11", "cost": { - "input": 0.01, - "output": 0 + "input": 0.8, + "output": 0.8 }, - "type": "embedding" + "type": "chat" }, { - "id": 
"Qwen/Qwen3-30B-A3B-Instruct-2507", - "name": "Qwen3-30B-A3B-Instruct-2507", - "display_name": "Qwen3-30B-A3B-Instruct-2507", + "id": "hf:Qwen/Qwen3-235B-A22B-Instruct-2507", + "name": "Qwen 3 235B Instruct", + "display_name": "Qwen 3 235B Instruct", "modalities": { "input": [ "text" @@ -181485,8 +184717,8 @@ ] }, "limit": { - "context": 128000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, @@ -181495,24 +184727,23 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "knowledge": "2025-04", + "release_date": "2025-04-28", + "last_updated": "2025-07-21", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B", - "name": "Qwen3.5-397B-A17B", - "display_name": "Qwen3.5-397B-A17B", + "id": "hf:nvidia/Kimi-K2.5-NVFP4", + "name": "Kimi K2.5 (NVFP4)", + "display_name": "Kimi K2.5 (NVFP4)", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -181520,7 +184751,7 @@ }, "limit": { "context": 262144, - "output": 8192 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -181541,21 +184772,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "knowledge": "2025-01", + "release_date": "2026-01", + "last_updated": "2026-01", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.55, + "output": 2.19 }, "type": "chat" }, { - "id": "Qwen/Qwen3.5-397B-A17B-fast", - "name": "Qwen3.5-397B-A17B-fast", - "display_name": "Qwen3.5-397B-A17B-fast", + "id": "hf:nvidia/NVIDIA-Nemotron-3-Super-120B-A12B-NVFP4", + "name": "Nemotron 3 Super 120B", + "display_name": "Nemotron 3 Super 120B", "modalities": { "input": [ "text" @@ -181565,8 +184794,8 @@ ] }, "limit": { - 
"context": 8000, - "output": 8192 + "context": 262144, + "output": 65536 }, "temperature": true, "tool_call": true, @@ -181587,21 +184816,29 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-15", - "last_updated": "2026-05-07", + "knowledge": "2024-04", + "release_date": "2026-03-11", + "last_updated": "2026-04-03", "cost": { - "input": 0.6, - "output": 3.6, - "cache_read": 0.06, - "cache_write": 0.75 + "input": 0.3, + "output": 1, + "cache_read": 0.3 }, "type": "chat" - }, + } + ] + }, + "iflowcn": { + "id": "iflowcn", + "name": "iFlow", + "display_name": "iFlow", + "api": "https://apis.iflow.cn/v1", + "doc": "https://platform.iflow.cn/en/docs", + "models": [ { - "id": "Qwen/Qwen3-235B-A22B-Instruct-2507", - "name": "Qwen3 235B A22B Instruct 2507", - "display_name": "Qwen3 235B A22B Instruct 2507", + "id": "qwen3-coder-plus", + "name": "Qwen3-Coder-Plus", + "display_name": "Qwen3-Coder-Plus", "modalities": { "input": [ "text" @@ -181611,30 +184848,29 @@ ] }, "limit": { - "context": 262144, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": false, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2025-10-04", + "open_weights": true, + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.2, - "output": 0.6 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking-fast", - "name": "Qwen3-Next-80B-A3B-Thinking-fast", - "display_name": "Qwen3-Next-80B-A3B-Thinking-fast", + "id": "deepseek-v3", + "name": "DeepSeek-V3", + "display_name": "DeepSeek-V3", "modalities": { "input": [ "text" @@ -181644,47 +184880,32 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": 
true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, "attachment": false, "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "knowledge": "2024-10", + "release_date": "2024-12-26", + "last_updated": "2024-12-26", "cost": { - "input": 0.15, - "output": 1.2, - "cache_read": 0.015, - "cache_write": 0.1875 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen2.5-VL-72B-Instruct", - "name": "Qwen2.5-VL-72B-Instruct", - "display_name": "Qwen2.5-VL-72B-Instruct", + "id": "kimi-k2", + "name": "Kimi-K2", + "display_name": "Kimi-K2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -181692,28 +184913,26 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": true, - "open_weights": true, - "knowledge": "2024-12", - "release_date": "2025-01-20", - "last_updated": "2026-02-04", + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.25, - "output": 0.75, - "cache_read": 0.025, - "cache_write": 0.31 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-32B", + "id": "qwen3-32b", "name": "Qwen3-32B", "display_name": "Qwen3-32B", "modalities": { @@ -181726,7 +184945,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -181746,21 +184965,19 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": 
"2024-12-01", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-235B-A22B-Thinking-2507-fast", - "name": "Qwen3-235B-A22B-Thinking-2507-fast", - "display_name": "Qwen3-235B-A22B-Thinking-2507-fast", + "id": "qwen3-max-preview", + "name": "Qwen3-Max-Preview", + "display_name": "Qwen3-Max-Preview", "modalities": { "input": [ "text" @@ -181770,14 +184987,13 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -181791,22 +185007,20 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-07", - "release_date": "2025-07-25", - "last_updated": "2026-05-07", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.5, - "output": 2, - "cache_read": 0.05, - "cache_write": 0.625 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "Qwen/Qwen3-Next-80B-A3B-Thinking", - "name": "Qwen3-Next-80B-A3B-Thinking", - "display_name": "Qwen3-Next-80B-A3B-Thinking", + "id": "qwen3-max", + "name": "Qwen3-Max", + "display_name": "Qwen3-Max", "modalities": { "input": [ "text" @@ -181816,14 +185030,13 @@ ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -181837,23 +185050,20 @@ } }, "attachment": false, - "open_weights": true, - "knowledge": "2025-12", - "release_date": "2026-01-28", - "last_updated": "2026-02-04", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.15, - "output": 1.2, - 
"reasoning": 1.2, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-2-2b-it", - "name": "Gemma-2-2b-it", - "display_name": "Gemma-2-2b-it", + "id": "qwen3-235b", + "name": "Qwen3-235B-A22B", + "display_name": "Qwen3-235B-A22B", "modalities": { "input": [ "text" @@ -181863,66 +185073,68 @@ ] }, "limit": { - "context": 8192, - "output": 4096 + "context": 128000, + "output": 32000 }, "temperature": true, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, "open_weights": true, - "knowledge": "2024-06", - "release_date": "2024-07-31", - "last_updated": "2026-02-04", + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2024-12-01", "cost": { - "input": 0.02, - "output": 0.06, - "cache_read": 0.002, - "cache_write": 0.025 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "google/gemma-3-27b-it", - "name": "Gemma-3-27b-it", - "display_name": "Gemma-3-27b-it", + "id": "glm-4.6", + "name": "GLM-4.6", + "display_name": "GLM-4.6", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 110000, - "output": 8192 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-10", - "release_date": "2026-01-20", - "last_updated": "2026-02-04", + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": false, + "knowledge": "2024-10", + "release_date": "2024-12-01", + "last_updated": "2025-11-13", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b-fast", - "name": "gpt-oss-120b-fast", - "display_name": 
"gpt-oss-120b-fast", + "id": "qwen3-235b-a22b-thinking-2507", + "name": "Qwen3-235B-A22B-Thinking", + "display_name": "Qwen3-235B-A22B-Thinking", "modalities": { "input": [ "text" @@ -181932,8 +185144,8 @@ ] }, "limit": { - "context": 8000, - "output": 8192 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -181941,23 +185153,32 @@ "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, "attachment": false, "open_weights": true, - "knowledge": "2025-06", - "release_date": "2025-06-10", - "last_updated": "2026-05-07", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.1, - "output": 0.5, - "cache_read": 0.01, - "cache_write": 0.125 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "openai/gpt-oss-120b", - "name": "gpt-oss-120b", - "display_name": "gpt-oss-120b", + "id": "deepseek-r1", + "name": "DeepSeek-R1", + "display_name": "DeepSeek-R1", "modalities": { "input": [ "text" @@ -181968,7 +185189,7 @@ }, "limit": { "context": 128000, - "output": 8192 + "output": 32000 }, "temperature": true, "tool_call": true, @@ -181989,110 +185210,95 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2025-09", - "release_date": "2026-01-10", - "last_updated": "2026-02-04", + "knowledge": "2024-12", + "release_date": "2025-01-20", + "last_updated": "2025-01-20", "cost": { - "input": 0.15, - "output": 0.6, - "reasoning": 0.6, - "cache_read": 0.015, - "cache_write": 0.18 + "input": 0, + "output": 0 }, "type": "chat" - } - ] - }, - "minimax": { - "id": "minimax", - "name": "MiniMax (minimax.io)", - "display_name": "MiniMax (minimax.io)", - "api": "https://api.minimax.io/anthropic/v1", - "doc": "https://platform.minimax.io/docs/guides/quickstart", - "models": [ + }, { - "id": "MiniMax-M2.5", - "name": 
"MiniMax-M2.5", - "display_name": "MiniMax-M2.5", + "id": "qwen3-vl-plus", + "name": "Qwen3-VL-Plus", + "display_name": "Qwen3-VL-Plus", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": false, - "open_weights": true, - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "attachment": true, + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M3", - "name": "MiniMax-M3", - "display_name": "MiniMax-M3", + "id": "qwen3-235b-a22b-instruct", + "name": "Qwen3-235B-A22B-Instruct", + "display_name": "Qwen3-235B-A22B-Instruct", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 128000 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-06-01", - "last_updated": "2026-06-01", + "knowledge": "2025-04", + "release_date": "2025-07-01", + "last_updated": "2025-07-01", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.12 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.5-highspeed", - "name": "MiniMax-M2.5-highspeed", - 
"display_name": "MiniMax-M2.5-highspeed", + "id": "kimi-k2-0905", + "name": "Kimi-K2-0905", + "display_name": "Kimi-K2-0905", "modalities": { "input": [ "text" @@ -182102,36 +185308,29 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 256000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, - "open_weights": true, - "release_date": "2026-02-13", - "last_updated": "2026-02-13", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2025-09-05", + "last_updated": "2025-09-05", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7", - "name": "MiniMax-M2.7", - "display_name": "MiniMax-M2.7", + "id": "deepseek-v3.2", + "name": "DeepSeek-V3.2-Exp", + "display_name": "DeepSeek-V3.2-Exp", "modalities": { "input": [ "text" @@ -182141,79 +185340,73 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 128000, + "output": 64000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-12", + "release_date": "2025-01-01", + "last_updated": "2025-01-01", "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0 }, "type": "chat" - }, + } + ] + }, + "xiaomi-token-plan-sgp": { + "id": "xiaomi-token-plan-sgp", + "name": "Xiaomi Token Plan (Singapore)", + "display_name": "Xiaomi Token Plan (Singapore)", 
+ "api": "https://token-plan-sgp.xiaomimimo.com/v1", + "doc": "https://platform.xiaomimimo.com/#/docs", + "models": [ { - "id": "MiniMax-M2", - "name": "MiniMax-M2", - "display_name": "MiniMax-M2", + "id": "mimo-v2.5-tts", + "name": "MiMo-V2.5-TTS", + "display_name": "MiMo-V2.5-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 196608, - "output": 128000 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "attachment": false, "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.3, - "output": 1.2 + "input": 0, + "output": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.7-highspeed", - "name": "MiniMax-M2.7-highspeed", - "display_name": "MiniMax-M2.7-highspeed", + "id": "mimo-v2.5-pro", + "name": "MiMo-V2.5-Pro", + "display_name": "MiMo-V2.5-Pro", "modalities": { "input": [ "text" @@ -182223,7 +185416,7 @@ ] }, "limit": { - "context": 204800, + "context": 1048576, "output": 131072 }, "temperature": true, @@ -182245,20 +185438,20 @@ }, "attachment": false, "open_weights": true, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { - "input": 0.6, - "output": 2.4, - "cache_read": 0.06, - "cache_write": 0.375 + "input": 0, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "MiniMax-M2.1", - "name": "MiniMax-M2.1", - "display_name": "MiniMax-M2.1", + "id": "mimo-v2-pro", + "name": "MiMo-V2-Pro", + "display_name": "MiMo-V2-Pro", "modalities": { "input": [ "text" @@ -182268,7 +185461,7 @@ ] }, "limit": { - "context": 204800, + "context": 1048576, "output": 131072 }, "temperature": true, 
@@ -182279,86 +185472,51 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-23", - "last_updated": "2025-12-23", - "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - } - ] - }, - "llama": { - "id": "llama", - "name": "Llama", - "display_name": "Llama", - "api": "https://api.llama.com/compat/v1/", - "doc": "https://llama.developer.meta.com/docs/models", - "models": [ - { - "id": "cerebras-llama-4-maverick-17b-128e-instruct", - "name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Cerebras-Llama-4-Maverick-17B-128E-Instruct", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 128000, - "output": 4096 - }, - "temperature": true, - "tool_call": true, - "reasoning": { - "supported": false - }, - "attachment": true, - "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "Groq-Llama-4-Maverick-17B-128E-Instruct", - "display_name": "Groq-Llama-4-Maverick-17B-128E-Instruct", + "id": "mimo-v2-tts", + "name": "MiMo-V2-TTS", + "display_name": "MiMo-V2-TTS", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - 
"last_updated": "2025-04-05", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0, "output": 0 @@ -182366,97 +185524,126 @@ "type": "chat" }, { - "id": "llama-4-maverick-17b-128e-instruct-fp8", - "name": "Llama-4-Maverick-17B-128E-Instruct-FP8", - "display_name": "Llama-4-Maverick-17B-128E-Instruct-FP8", + "id": "mimo-v2-omni", + "name": "MiMo-V2-Omni", + "display_name": "MiMo-V2-Omni", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 262144, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, - "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "open_weights": false, + "knowledge": "2024-12", + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "llama-4-scout-17b-16e-instruct-fp8", - "name": "Llama-4-Scout-17B-16E-Instruct-FP8", - "display_name": "Llama-4-Scout-17B-16E-Instruct-FP8", + "id": "mimo-v2.5", + "name": "MiMo-V2.5", + "display_name": "MiMo-V2.5", "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 1048576, + "output": 131072 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } 
}, "attachment": true, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "knowledge": "2024-12", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { "input": 0, - "output": 0 + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "cerebras-llama-4-scout-17b-16e-instruct", - "name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", - "display_name": "Cerebras-Llama-4-Scout-17B-16E-Instruct", + "id": "mimo-v2.5-tts-voicedesign", + "name": "MiMo-V2.5-TTS-VoiceDesign", + "display_name": "MiMo-V2.5-TTS-VoiceDesign", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2025-04-05", - "last_updated": "2025-04-05", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { "input": 0, "output": 0 @@ -182464,66 +185651,77 @@ "type": "chat" }, { - "id": "llama-3.3-8b-instruct", - "name": "Llama-3.3-8B-Instruct", - "display_name": "Llama-3.3-8B-Instruct", + "id": "mimo-v2.5-tts-voiceclone", + "name": "MiMo-V2.5-TTS-VoiceClone", + "display_name": "MiMo-V2.5-TTS-VoiceClone", "modalities": { "input": [ "text" ], "output": [ - "text" + "audio" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 8192, + "output": 8192 }, - "temperature": true, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "release_date": "2026-04-22", + "last_updated": "2026-04-22", "cost": { "input": 0, "output": 0 }, "type": "chat" - }, + } + ] + }, + "claudinio": { + "id": "claudinio", + 
"name": "Claudinio", + "display_name": "Claudinio", + "api": "https://api.claudin.io/v1", + "doc": "https://claudin.io", + "models": [ { - "id": "llama-3.3-70b-instruct", - "name": "Llama-3.3-70B-Instruct", - "display_name": "Llama-3.3-70B-Instruct", + "id": "claudinio", + "name": "Claudinio", + "display_name": "Claudinio", "modalities": { "input": [ - "text" + "text", + "image", + "audio", + "video" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 4096 + "context": 256000, + "output": 64000 }, - "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, - "open_weights": true, - "knowledge": "2023-12", - "release_date": "2024-12-06", - "last_updated": "2024-12-06", + "open_weights": false, + "knowledge": "2026-05", + "release_date": "2026-05-12", + "last_updated": "2026-06-02", "cost": { - "input": 0, - "output": 0 + "input": 0.5, + "output": 2, + "cache_read": 0.15 }, "type": "chat" } @@ -194610,36 +197808,47 @@ "type": "chat" }, { - "id": "qwen3-vl:235b-instruct", - "name": "qwen3-vl:235b-instruct", - "display_name": "qwen3-vl:235b-instruct", + "id": "deepseek-v4-flash", + "name": "deepseek-v4-flash", + "display_name": "deepseek-v4-flash", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 131072 + "context": 1048576, + "output": 1048576 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, - "attachment": true, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": false, "open_weights": true, - "release_date": "2025-09-22", - "last_updated": "2026-01-19", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "kimi-k2:1t", - "name": "kimi-k2:1t", - 
"display_name": "kimi-k2:1t", + "id": "minimax-m2.5", + "name": "minimax-m2.5", + "display_name": "minimax-m2.5", "modalities": { "input": [ "text" @@ -194649,24 +197858,30 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 204800, + "output": 131072 }, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "attachment": false, "open_weights": true, - "knowledge": "2024-10", - "release_date": "2025-07-11", - "last_updated": "2026-01-19", + "knowledge": "2025-01", + "release_date": "2026-02-12", + "last_updated": "2026-02-12", "type": "chat" }, { - "id": "glm-4.6", - "name": "glm-4.6", - "display_name": "glm-4.6", + "id": "glm-4.7", + "name": "glm-4.7", + "display_name": "glm-4.7", "modalities": { "input": [ "text" @@ -194686,19 +197901,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-09-29", + "release_date": "2025-12-22", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "nemotron-3-ultra", - "name": "nemotron-3-ultra", - "display_name": "nemotron-3-ultra", + "id": "minimax-m2.1", + "name": "minimax-m2.1", + "display_name": "minimax-m2.1", "modalities": { "input": [ "text" @@ -194708,25 +197929,29 @@ ] }, "limit": { - "context": 262144, - "output": 128000 + "context": 204800, + "output": 131072 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, "attachment": false, "open_weights": true, - "release_date": "2026-06-04", - "last_updated": "2026-06-04", + "release_date": "2025-12-23", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "kimi-k2-thinking", - "name": 
"kimi-k2-thinking", - "display_name": "kimi-k2-thinking", + "id": "glm-5.1", + "name": "glm-5.1", + "display_name": "glm-5.1", "modalities": { "input": [ "text" @@ -194736,8 +197961,8 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 202752, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -194757,30 +197982,26 @@ }, "attachment": false, "open_weights": true, - "knowledge": "2024-08", - "release_date": "2025-11-06", - "last_updated": "2026-01-19", + "release_date": "2026-03-27", + "last_updated": "2026-04-07", "type": "chat" }, { - "id": "minimax-m3", - "name": "minimax-m3", - "display_name": "minimax-m3", + "id": "deepseek-v4-pro", + "name": "deepseek-v4-pro", + "display_name": "deepseek-v4-pro", "modalities": { "input": [ - "text", - "image", - "video" + "text" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 131072 + "context": 1048576, + "output": 1048576 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -194788,20 +198009,25 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, - "attachment": true, + "attachment": false, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-05-31", - "last_updated": "2026-05-31", + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "type": "chat" }, { - "id": "deepseek-v3.2", - "name": "deepseek-v3.2", - "display_name": "deepseek-v3.2", + "id": "glm-4.6", + "name": "glm-4.6", + "display_name": "glm-4.6", "modalities": { "input": [ "text" @@ -194811,8 +198037,8 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 202752, + "output": 131072 }, "tool_call": true, "reasoning": { @@ -194826,14 +198052,14 @@ }, "attachment": false, "open_weights": true, - "release_date": "2025-06-15", + "release_date": "2025-09-29", "last_updated": "2026-01-19", 
"type": "chat" }, { - "id": "minimax-m2.1", - "name": "minimax-m2.1", - "display_name": "minimax-m2.1", + "id": "kimi-k2-thinking", + "name": "kimi-k2-thinking", + "display_name": "kimi-k2-thinking", "modalities": { "input": [ "text" @@ -194843,8 +198069,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -194853,32 +198079,41 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-23", + "knowledge": "2024-08", + "release_date": "2025-11-06", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "kimi-k2.6", - "name": "kimi-k2.6", - "display_name": "kimi-k2.6", + "id": "minimax-m3", + "name": "minimax-m3", + "display_name": "minimax-m3", "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 512000, + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -194891,14 +198126,15 @@ }, "attachment": true, "open_weights": true, - "release_date": "2026-04-20", - "last_updated": "2026-04-20", + "knowledge": "2025-01", + "release_date": "2026-05-31", + "last_updated": "2026-05-31", "type": "chat" }, { - "id": "glm-4.7", - "name": "glm-4.7", - "display_name": "glm-4.7", + "id": "minimax-m2", + "name": "minimax-m2", + "display_name": "minimax-m2", "modalities": { "input": [ "text" @@ -194908,8 +198144,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 204800, + "output": 128000 }, "tool_call": true, "reasoning": { @@ -194918,68 +198154,22 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - 
"thinking_blocks" - ] + "supported": true } }, "attachment": false, "open_weights": true, - "release_date": "2025-12-22", + "release_date": "2025-10-23", "last_updated": "2026-01-19", "type": "chat" }, { - "id": "qwen3.5:397b", - "name": "qwen3.5:397b", - "display_name": "qwen3.5:397b", + "id": "kimi-k2:1t", + "name": "kimi-k2:1t", + "display_name": "kimi-k2:1t", "modalities": { "input": [ - "text", - "image" - ], - "output": [ "text" - ] - }, - "limit": { - "context": 262144, - "output": 65536 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, - "open_weights": true, - "release_date": "2026-02-15", - "last_updated": "2026-02-17", - "type": "chat" - }, - { - "id": "mistral-large-3:675b", - "name": "mistral-large-3:675b", - "display_name": "mistral-large-3:675b", - "modalities": { - "input": [ - "text", - "image" ], "output": [ "text" @@ -194993,9 +198183,10 @@ "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2025-12-02", + "knowledge": "2024-10", + "release_date": "2025-07-11", "last_updated": "2026-01-19", "type": "chat" }, @@ -195038,20 +198229,21 @@ "type": "chat" }, { - "id": "deepseek-v4-flash", - "name": "deepseek-v4-flash", - "display_name": "deepseek-v4-flash", + "id": "kimi-k2.5", + "name": "kimi-k2.5", + "display_name": "kimi-k2.5", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -195069,27 +198261,28 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2026-01-27", + 
"last_updated": "2026-01-27", "type": "chat" }, { - "id": "glm-5", - "name": "glm-5", - "display_name": "glm-5", + "id": "qwen3.5:397b", + "name": "qwen3.5:397b", + "display_name": "qwen3.5:397b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 262144, + "output": 65536 }, "tool_call": true, "reasoning": { @@ -195107,27 +198300,28 @@ ] } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-02-11", - "last_updated": "2026-02-11", + "release_date": "2026-02-15", + "last_updated": "2026-02-17", "type": "chat" }, { - "id": "minimax-m2", - "name": "minimax-m2", - "display_name": "minimax-m2", + "id": "kimi-k2.6", + "name": "kimi-k2.6", + "display_name": "kimi-k2.6", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, - "output": 128000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -195139,91 +198333,73 @@ "supported": true } }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2025-10-23", - "last_updated": "2026-01-19", + "release_date": "2026-04-20", + "last_updated": "2026-04-20", "type": "chat" }, { - "id": "minimax-m2.5", - "name": "minimax-m2.5", - "display_name": "minimax-m2.5", + "id": "qwen3-vl:235b-instruct", + "name": "qwen3-vl:235b-instruct", + "display_name": "qwen3-vl:235b-instruct", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 204800, + "context": 262144, "output": 131072 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "knowledge": "2025-01", - "release_date": "2026-02-12", - "last_updated": "2026-02-12", + "release_date": "2025-09-22", 
+ "last_updated": "2026-01-19", "type": "chat" }, { - "id": "deepseek-v4-pro", - "name": "deepseek-v4-pro", - "display_name": "deepseek-v4-pro", + "id": "mistral-large-3:675b", + "name": "mistral-large-3:675b", + "display_name": "mistral-large-3:675b", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 1048576 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } + "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2026-04-24", - "last_updated": "2026-04-24", + "release_date": "2025-12-02", + "last_updated": "2026-01-19", "type": "chat" }, { - "id": "kimi-k2.5", - "name": "kimi-k2.5", - "display_name": "kimi-k2.5", + "id": "nemotron-3-ultra", + "name": "nemotron-3-ultra", + "display_name": "nemotron-3-ultra", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" @@ -195231,34 +198407,24 @@ }, "limit": { "context": 262144, - "output": 262144 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": true, + "attachment": false, "open_weights": true, - "release_date": "2026-01-27", - "last_updated": "2026-01-27", + "release_date": "2026-06-04", + "last_updated": "2026-06-04", "type": "chat" }, { - "id": "glm-5.1", - "name": "glm-5.1", - "display_name": "glm-5.1", + "id": "glm-5", + "name": "glm-5", + "display_name": "glm-5", "modalities": { "input": [ "text" @@ -195289,8 +198455,40 @@ }, "attachment": false, 
"open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-04-07", + "release_date": "2026-02-11", + "last_updated": "2026-02-11", + "type": "chat" + }, + { + "id": "deepseek-v3.2", + "name": "deepseek-v3.2", + "display_name": "deepseek-v3.2", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 163840, + "output": 65536 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "attachment": false, + "open_weights": true, + "release_date": "2025-06-15", + "last_updated": "2026-01-19", "type": "chat" } ] @@ -206982,6 +210180,80 @@ }, "type": "chat" }, + { + "id": "gemini-3.1-flash-image", + "name": "gemini-3.1-flash-image", + "display_name": "gemini-3.1-flash-image", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.5, + "output": 3, + "cache_read": 0.5 + }, + "type": "imageGeneration" + }, + { + "id": "gemini-3-pro-image", + "name": "gemini-3-pro-image", + "display_name": "gemini-3-pro-image", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "level", + "level": "high", + "level_options": [ + "low", + "high" + ], + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } + }, + "cost": { + "input": 2, + "output": 12, + "cache_read": 2 + }, + "type": "imageGeneration" + }, { "id": "step-3.7-flash-free", "name": "step-3.7-flash-free", @@ -207115,9 +210387,9 @@ "supported": 
false }, "cost": { - "input": 0.22, - "output": 1.32, - "cache_read": 0.044 + "input": 0.022, + "output": 0.132, + "cache_read": 0.0044 }, "type": "chat" }, @@ -208285,13 +211557,12 @@ "type": "imageGeneration" }, { - "id": "wan2.7-videoedit", - "name": "wan2.7-videoedit", - "display_name": "wan2.7-videoedit", + "id": "wan2.7-t2v", + "name": "wan2.7-t2v", + "display_name": "wan2.7-t2v", "modalities": { "input": [ - "text", - "video" + "text" ] }, "limit": { @@ -208309,12 +211580,13 @@ "type": "chat" }, { - "id": "wan2.7-t2v", - "name": "wan2.7-t2v", - "display_name": "wan2.7-t2v", + "id": "wan2.7-videoedit", + "name": "wan2.7-videoedit", + "display_name": "wan2.7-videoedit", "modalities": { "input": [ - "text" + "text", + "video" ] }, "limit": { @@ -216652,6 +219924,30 @@ }, "type": "chat" }, + { + "id": "gte-rerank-v2", + "name": "gte-rerank-v2", + "display_name": "gte-rerank-v2", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.11, + "output": 0.11 + }, + "type": "rerank" + }, { "id": "inclusionAI/Ling-flash-2.0", "name": "inclusionAI/Ling-flash-2.0", @@ -217254,30 +220550,6 @@ }, "type": "embedding" }, - { - "id": "gte-rerank-v2", - "name": "gte-rerank-v2", - "display_name": "gte-rerank-v2", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.11, - "output": 0.11 - }, - "type": "rerank" - }, { "id": "bce-reranker-base", "name": "bce-reranker-base", @@ -219535,25 +222807,6 @@ }, "type": "chat" }, - { - "id": "unsloth/gemma-3-12b-it", - "name": "unsloth/gemma-3-12b-it", - "display_name": "unsloth/gemma-3-12b-it", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - 
"output": 0.8, - "cache_read": 0 - }, - "type": "chat" - }, { "id": "gemini-exp-1206", "name": "gemini-exp-1206", @@ -219596,6 +222849,25 @@ }, "type": "chat" }, + { + "id": "unsloth/gemma-3-12b-it", + "name": "unsloth/gemma-3-12b-it", + "display_name": "unsloth/gemma-3-12b-it", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.8, + "cache_read": 0 + }, + "type": "chat" + }, { "id": "qwen-max-0125", "name": "qwen-max-0125", @@ -220273,6 +223545,36 @@ }, "type": "chat" }, + { + "id": "qwen3-14b", + "name": "qwen3-14b", + "display_name": "qwen3-14b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "cost": { + "input": 0.16, + "output": 1.6, + "cache_read": 0 + }, + "type": "chat" + }, { "id": "aihub-Phi-4", "name": "aihub-Phi-4", @@ -220339,9 +223641,28 @@ "type": "imageGeneration" }, { - "id": "qwen3-14b", - "name": "qwen3-14b", - "display_name": "qwen3-14b", + "id": "grok-3-fast", + "name": "grok-3-fast", + "display_name": "grok-3-fast", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 5.5, + "output": 27.5, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "qwen3-8b", + "name": "qwen3-8b", + "display_name": "qwen3-8b", "limit": { "context": 8192, "output": 8192 @@ -220362,16 +223683,16 @@ } }, "cost": { - "input": 0.16, - "output": 1.6, + "input": 0.08, + "output": 0.8, "cache_read": 0 }, "type": "chat" }, { - "id": "qwen3-8b", - "name": "qwen3-8b", - "display_name": "qwen3-8b", + "id": "qwen3-4b", + "name": "qwen3-4b", + "display_name": "qwen3-4b", "limit": { "context": 8192, "output": 8192 @@ 
-220392,16 +223713,16 @@ } }, "cost": { - "input": 0.08, - "output": 0.8, + "input": 0.046, + "output": 0.46, "cache_read": 0 }, "type": "chat" }, { - "id": "grok-3-fast", - "name": "grok-3-fast", - "display_name": "grok-3-fast", + "id": "deepseek-ai/DeepSeek-R1-Zero", + "name": "deepseek-ai/DeepSeek-R1-Zero", + "display_name": "deepseek-ai/DeepSeek-R1-Zero", "limit": { "context": 8192, "output": 8192 @@ -220411,9 +223732,8 @@ "supported": false }, "cost": { - "input": 5.5, - "output": 27.5, - "cache_read": 0 + "input": 2.2, + "output": 2.2 }, "type": "chat" }, @@ -220456,39 +223776,9 @@ "type": "chat" }, { - "id": "qwen3-4b", - "name": "qwen3-4b", - "display_name": "qwen3-4b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "cost": { - "input": 0.046, - "output": 0.46, - "cache_read": 0 - }, - "type": "chat" - }, - { - "id": "deepseek-ai/DeepSeek-R1-Zero", - "name": "deepseek-ai/DeepSeek-R1-Zero", - "display_name": "deepseek-ai/DeepSeek-R1-Zero", + "id": "grok-3-mini-beta", + "name": "grok-3-mini-beta", + "display_name": "grok-3-mini-beta", "limit": { "context": 8192, "output": 8192 @@ -220498,8 +223788,9 @@ "supported": false }, "cost": { - "input": 2.2, - "output": 2.2 + "input": 0.33, + "output": 0.5511, + "cache_read": 0 }, "type": "chat" }, @@ -220533,25 +223824,6 @@ }, "type": "chat" }, - { - "id": "grok-3-mini-beta", - "name": "grok-3-mini-beta", - "display_name": "grok-3-mini-beta", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.33, - "output": 0.5511, - "cache_read": 0 - }, - "type": "chat" - }, { "id": "qwen3-0.6b", "name": "qwen3-0.6b", @@ -221282,6 +224554,30 @@ }, "type": "chat" }, + { + "id": 
"wan2.6-t2i", + "name": "wan2.6-t2i", + "display_name": "wan2.6-t2i", + "modalities": { + "input": [ + "image", + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 0 + }, + "type": "imageGeneration" + }, { "id": "grok-2-1212", "name": "grok-2-1212", @@ -221301,13 +224597,125 @@ "type": "chat" }, { - "id": "wan2.6-t2i", - "name": "wan2.6-t2i", - "display_name": "wan2.6-t2i", + "id": "gpt-image-test", + "name": "gpt-image-test", + "display_name": "gpt-image-test", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 5, + "output": 40, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "grok-4.20-beta-0309-non-reasoning", + "name": "grok-4.20-beta-0309-non-reasoning", + "display_name": "grok-4.20-beta-0309-non-reasoning", "modalities": { "input": [ - "image", - "text" + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "grok-4.20-beta-0309-reasoning", + "name": "grok-4.20-beta-0309-reasoning", + "display_name": "grok-4.20-beta-0309-reasoning", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "grok-4.20-multi-agent-beta-0309", + "name": "grok-4.20-multi-agent-beta-0309", + "display_name": "grok-4.20-multi-agent-beta-0309", + "modalities": { + "input": 
[ + "text", + "image" + ] + }, + "limit": { + "context": 2000000, + "output": 2000000 + }, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 2, + "output": 6, + "cache_read": 0.2 + }, + "type": "chat" + }, + { + "id": "imagen-3.0-generate-002", + "name": "imagen-3.0-generate-002", + "display_name": "imagen-3.0-generate-002", + "modalities": { + "input": [ + "text", + "image" ] }, "limit": { @@ -221320,14 +224728,223 @@ }, "cost": { "input": 2, - "output": 0 + "output": 2, + "cache_read": 0 }, "type": "imageGeneration" }, { - "id": "imagen-3.0-generate-002", - "name": "imagen-3.0-generate-002", - "display_name": "imagen-3.0-generate-002", + "id": "llama3.1-8b", + "name": "llama3.1-8b", + "display_name": "llama3.1-8b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.3, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "o1-2024-12-17", + "name": "o1-2024-12-17", + "display_name": "o1-2024-12-17", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "default_enabled": true, + "mode": "effort", + "effort": "medium", + "effort_options": [ + "low", + "medium", + "high" + ], + "visibility": "hidden" + } + }, + "cost": { + "input": 15, + "output": 60, + "cache_read": 7.5 + }, + "type": "chat" + }, + { + "id": "sf-kimi-k2-thinking", + "name": "sf-kimi-k2-thinking", + "display_name": "sf-kimi-k2-thinking", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.548, + "output": 2.192 + }, + "type": "chat" + }, + { + "id": "DESCRIBE", + "name": "DESCRIBE", + 
"display_name": "DESCRIBE", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 2, + "cache_read": 0 + }, + "type": "imageGeneration" + }, + { + "id": "UPSCALE", + "name": "UPSCALE", + "display_name": "UPSCALE", + "modalities": { + "input": [ + "text", + "image" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2, + "output": 2, + "cache_read": 0 + }, + "type": "imageGeneration" + }, + { + "id": "bai-qwen3-vl-235b-a22b-instruct", + "name": "bai-qwen3-vl-235b-a22b-instruct", + "display_name": "bai-qwen3-vl-235b-a22b-instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.274, + "output": 1.096 + }, + "type": "chat" + }, + { + "id": "cc-MiniMax-M2", + "name": "cc-MiniMax-M2", + "display_name": "cc-MiniMax-M2", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.1, + "output": 0.1 + }, + "type": "chat" + }, + { + "id": "cc-deepseek-v3", + "name": "cc-deepseek-v3", + "display_name": "cc-deepseek-v3", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.3, + "output": 0.3 + }, + "type": "chat" + }, + { + "id": "cc-deepseek-v3.1", + "name": "cc-deepseek-v3.1", + "display_name": "cc-deepseek-v3.1", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.56, + "output": 1.68 + }, + "type": "chat" + }, + { + "id": "cc-ernie-4.5-300b-a47b", + "name": 
"cc-ernie-4.5-300b-a47b", + "display_name": "cc-ernie-4.5-300b-a47b", "modalities": { "input": [ "text", @@ -221338,21 +224955,626 @@ "context": 8192, "output": 8192 }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.32, + "output": 1.28, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "cc-kimi-dev-72b", + "name": "cc-kimi-dev-72b", + "display_name": "cc-kimi-dev-72b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.32, + "output": 1.28, + "cache_read": 0 + }, + "type": "chat" + }, + { + "id": "cc-kimi-k2-instruct", + "name": "cc-kimi-k2-instruct", + "display_name": "cc-kimi-k2-instruct", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 1.1, + "output": 3.3 + }, + "type": "chat" + }, + { + "id": "cc-kimi-k2-instruct-0905", + "name": "cc-kimi-k2-instruct-0905", + "display_name": "cc-kimi-k2-instruct-0905", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": true, + "reasoning": { + "supported": false + }, + "cost": { + "input": 1.1, + "output": 3.3 + }, + "type": "chat" + }, + { + "id": "cc-kimi-k2-thinking", + "name": "cc-kimi-k2-thinking", + "display_name": "cc-kimi-k2-thinking", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.548, + "output": 2.192 + }, + "type": "chat" + }, + { + "id": "computer-use-preview", + "name": "computer-use-preview", + "display_name": "computer-use-preview", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 3, + "output": 12 + }, + "type": "chat" + }, + { + "id": "Baichuan3-Turbo", + "name": 
"Baichuan3-Turbo", + "display_name": "Baichuan3-Turbo", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 1.9, + "output": 1.9 + }, + "type": "chat" + }, + { + "id": "Baichuan3-Turbo-128k", + "name": "Baichuan3-Turbo-128k", + "display_name": "Baichuan3-Turbo-128k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 3.8, + "output": 3.8 + }, + "type": "chat" + }, + { + "id": "Baichuan4", + "name": "Baichuan4", + "display_name": "Baichuan4", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 16, + "output": 16 + }, + "type": "chat" + }, + { + "id": "Baichuan4-Air", + "name": "Baichuan4-Air", + "display_name": "Baichuan4-Air", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.16, + "output": 0.16 + }, + "type": "chat" + }, + { + "id": "Baichuan4-Turbo", + "name": "Baichuan4-Turbo", + "display_name": "Baichuan4-Turbo", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 2.4, + "output": 2.4 + }, + "type": "chat" + }, + { + "id": "DeepSeek-v3", + "name": "DeepSeek-v3", + "display_name": "DeepSeek-v3", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.272, + "output": 1.088 + }, + "type": "chat" + }, + { + "id": "Doubao-1.5-lite-32k", + "name": "Doubao-1.5-lite-32k", + "display_name": "Doubao-1.5-lite-32k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.05, + "output": 0.1, + "cache_read": 0.01 + }, + "type": "chat" + }, + { + "id": 
"Doubao-1.5-pro-256k", + "name": "Doubao-1.5-pro-256k", + "display_name": "Doubao-1.5-pro-256k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.8, + "output": 1.44, + "cache_read": 0.8 + }, + "type": "chat" + }, + { + "id": "Doubao-1.5-pro-32k", + "name": "Doubao-1.5-pro-32k", + "display_name": "Doubao-1.5-pro-32k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.134, + "output": 0.335, + "cache_read": 0.0268 + }, + "type": "chat" + }, + { + "id": "Doubao-1.5-vision-pro-32k", + "name": "Doubao-1.5-vision-pro-32k", + "display_name": "Doubao-1.5-vision-pro-32k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.46, + "output": 1.38 + }, + "type": "chat" + }, + { + "id": "Doubao-lite-128k", + "name": "Doubao-lite-128k", + "display_name": "Doubao-lite-128k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.14, + "output": 0.28, + "cache_read": 0.14 + }, + "type": "chat" + }, + { + "id": "Doubao-lite-32k", + "name": "Doubao-lite-32k", + "display_name": "Doubao-lite-32k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.06, + "output": 0.12, + "cache_read": 0.012 + }, + "type": "chat" + }, + { + "id": "Doubao-lite-4k", + "name": "Doubao-lite-4k", + "display_name": "Doubao-lite-4k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.06, + "output": 0.12, + "cache_read": 0.06 + }, + "type": "chat" + }, + { + "id": "Doubao-pro-128k", + "name": "Doubao-pro-128k", + "display_name": "Doubao-pro-128k", + "limit": { + 
"context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.8, + "output": 1.44 + }, + "type": "chat" + }, + { + "id": "Doubao-pro-256k", + "name": "Doubao-pro-256k", + "display_name": "Doubao-pro-256k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.8, + "output": 1.44, + "cache_read": 0.8 + }, + "type": "chat" + }, + { + "id": "Doubao-pro-32k", + "name": "Doubao-pro-32k", + "display_name": "Doubao-pro-32k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.14, + "output": 0.35, + "cache_read": 0.028 + }, + "type": "chat" + }, + { + "id": "Doubao-pro-4k", + "name": "Doubao-pro-4k", + "display_name": "Doubao-pro-4k", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.14, + "output": 0.35 + }, + "type": "chat" + }, + { + "id": "GPT-OSS-20B", + "name": "GPT-OSS-20B", + "display_name": "GPT-OSS-20B", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } + }, + "cost": { + "input": 0.11, + "output": 0.55 + }, + "type": "chat" + }, + { + "id": "Gryphe/MythoMax-L2-13b", + "name": "Gryphe/MythoMax-L2-13b", + "display_name": "Gryphe/MythoMax-L2-13b", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.4, + "output": 0.4 + }, + "type": "chat" + }, + { + "id": "MiniMax-Text-01", + "name": "MiniMax-Text-01", + "display_name": "MiniMax-Text-01", + "modalities": { + "input": [ + "text" + ] + }, + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + 
"cost": { + "input": 0.14, + "output": 1.12 + }, + "type": "chat" + }, + { + "id": "Mistral-large-2407", + "name": "Mistral-large-2407", + "display_name": "Mistral-large-2407", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 3, + "output": 9 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-1.5B-Instruct", + "name": "Qwen/Qwen2-1.5B-Instruct", + "display_name": "Qwen/Qwen2-1.5B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.2, + "output": 0.2 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-57B-A14B-Instruct", + "name": "Qwen/Qwen2-57B-A14B-Instruct", + "display_name": "Qwen/Qwen2-57B-A14B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.24, + "output": 0.24 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-72B-Instruct", + "name": "Qwen/Qwen2-72B-Instruct", + "display_name": "Qwen/Qwen2-72B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.8, + "output": 0.8 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2-7B-Instruct", + "name": "Qwen/Qwen2-7B-Instruct", + "display_name": "Qwen/Qwen2-7B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.08, + "output": 0.08 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-32B-Instruct", + "name": "Qwen/Qwen2.5-32B-Instruct", + "display_name": "Qwen/Qwen2.5-32B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, + "tool_call": false, + "reasoning": { + "supported": false + }, + "cost": { + "input": 0.6, + "output": 0.6 + }, + "type": "chat" + }, + { + "id": "Qwen/Qwen2.5-72B-Instruct", + "name": 
"Qwen/Qwen2.5-72B-Instruct", + "display_name": "Qwen/Qwen2.5-72B-Instruct", + "limit": { + "context": 8192, + "output": 8192 + }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.8, + "output": 0.8 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "llama3.1-8b", - "name": "llama3.1-8b", - "display_name": "llama3.1-8b", + "id": "Qwen/Qwen2.5-72B-Instruct-128K", + "name": "Qwen/Qwen2.5-72B-Instruct-128K", + "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", "limit": { "context": 8192, "output": 8192 @@ -221362,55 +225584,33 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.6 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "o1-2024-12-17", - "name": "o1-2024-12-17", - "display_name": "o1-2024-12-17", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "Qwen/Qwen2.5-7B-Instruct", + "name": "Qwen/Qwen2.5-7B-Instruct", + "display_name": "Qwen/Qwen2.5-7B-Instruct", "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "effort", - "effort": "medium", - "effort_options": [ - "low", - "medium", - "high" - ], - "visibility": "hidden" - } + "supported": false }, "cost": { - "input": 15, - "output": 60, - "cache_read": 7.5 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "sf-kimi-k2-thinking", - "name": "sf-kimi-k2-thinking", - "display_name": "sf-kimi-k2-thinking", + "id": "Qwen/Qwen2.5-Coder-32B-Instruct", + "name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -221420,40 +225620,44 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 0.16, + "output": 0.16 }, "type": "chat" }, { - "id": "DESCRIBE", - "name": "DESCRIBE", - "display_name": 
"DESCRIBE", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "Qwen3-235B-A22B-Thinking-2507", + "name": "Qwen3-235B-A22B-Thinking-2507", + "display_name": "Qwen3-235B-A22B-Thinking-2507", "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "cost": { - "input": 2, - "output": 2, - "cache_read": 0 + "input": 0.28, + "output": 2.8 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "UPSCALE", - "name": "UPSCALE", - "display_name": "UPSCALE", + "id": "Stable-Diffusion-3-5-Large", + "name": "Stable-Diffusion-3-5-Large", + "display_name": "Stable-Diffusion-3-5-Large", "modalities": { "input": [ "text", @@ -221469,16 +225673,16 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, + "input": 4, + "output": 4, "cache_read": 0 }, "type": "imageGeneration" }, { - "id": "bai-qwen3-vl-235b-a22b-instruct", - "name": "bai-qwen3-vl-235b-a22b-instruct", - "display_name": "bai-qwen3-vl-235b-a22b-instruct", + "id": "WizardLM/WizardCoder-Python-34B-V1.0", + "name": "WizardLM/WizardCoder-Python-34B-V1.0", + "display_name": "WizardLM/WizardCoder-Python-34B-V1.0", "limit": { "context": 8192, "output": 8192 @@ -221488,38 +225692,33 @@ "supported": false }, "cost": { - "input": 0.274, - "output": 1.096 + "input": 0.9, + "output": 0.9 }, "type": "chat" }, { - "id": "cc-MiniMax-M2", - "name": "cc-MiniMax-M2", - "display_name": "cc-MiniMax-M2", - "modalities": { - "input": [ - "text" - ] - }, + "id": "ahm-Phi-3-5-MoE-instruct", + "name": "ahm-Phi-3-5-MoE-instruct", + "display_name": "ahm-Phi-3-5-MoE-instruct", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.4, + 
"output": 1.6 }, "type": "chat" }, { - "id": "cc-deepseek-v3", - "name": "cc-deepseek-v3", - "display_name": "cc-deepseek-v3", + "id": "ahm-Phi-3-5-mini-instruct", + "name": "ahm-Phi-3-5-mini-instruct", + "display_name": "ahm-Phi-3-5-mini-instruct", "limit": { "context": 8192, "output": 8192 @@ -221529,63 +225728,57 @@ "supported": false }, "cost": { - "input": 0.3, - "output": 0.3 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "cc-deepseek-v3.1", - "name": "cc-deepseek-v3.1", - "display_name": "cc-deepseek-v3.1", + "id": "ahm-Phi-3-5-vision-instruct", + "name": "ahm-Phi-3-5-vision-instruct", + "display_name": "ahm-Phi-3-5-vision-instruct", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.56, - "output": 1.68 + "input": 0.4, + "output": 1.6 }, "type": "chat" }, { - "id": "cc-ernie-4.5-300b-a47b", - "name": "cc-ernie-4.5-300b-a47b", - "display_name": "cc-ernie-4.5-300b-a47b", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "ahm-Phi-3-medium-128k", + "name": "ahm-Phi-3-medium-128k", + "display_name": "ahm-Phi-3-medium-128k", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 6, + "output": 18 }, "type": "chat" }, { - "id": "cc-kimi-dev-72b", - "name": "cc-kimi-dev-72b", - "display_name": "cc-kimi-dev-72b", + "id": "ahm-Phi-3-medium-4k", + "name": "ahm-Phi-3-medium-4k", + "display_name": "ahm-Phi-3-medium-4k", "limit": { "context": 8192, "output": 8192 @@ -221595,62 +225788,56 @@ "supported": false }, "cost": { - "input": 0.32, - "output": 1.28, - "cache_read": 0 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "cc-kimi-k2-instruct", - "name": "cc-kimi-k2-instruct", - "display_name": "cc-kimi-k2-instruct", - "modalities": 
{ - "input": [ - "text" - ] - }, + "id": "ahm-Phi-3-small-128k", + "name": "ahm-Phi-3-small-128k", + "display_name": "ahm-Phi-3-small-128k", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 3.3 + "input": 1, + "output": 3 }, "type": "chat" }, { - "id": "cc-kimi-k2-instruct-0905", - "name": "cc-kimi-k2-instruct-0905", - "display_name": "cc-kimi-k2-instruct-0905", - "modalities": { - "input": [ - "text" - ] - }, + "id": "aihubmix-Codestral-2501", + "name": "aihubmix-Codestral-2501", + "display_name": "aihubmix-Codestral-2501", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1.1, - "output": 3.3 + "input": 0.4, + "output": 1.2 }, "type": "chat" }, { - "id": "cc-kimi-k2-thinking", - "name": "cc-kimi-k2-thinking", - "display_name": "cc-kimi-k2-thinking", + "id": "aihubmix-Cohere-command-r", + "name": "aihubmix-Cohere-command-r", + "display_name": "aihubmix-Cohere-command-r", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -221660,15 +225847,15 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 0.64, + "output": 1.92 }, "type": "chat" }, { - "id": "computer-use-preview", - "name": "computer-use-preview", - "display_name": "computer-use-preview", + "id": "aihubmix-Jamba-1-5-Large", + "name": "aihubmix-Jamba-1-5-Large", + "display_name": "aihubmix-Jamba-1-5-Large", "limit": { "context": 8192, "output": 8192 @@ -221678,15 +225865,15 @@ "supported": false }, "cost": { - "input": 3, - "output": 12 + "input": 2.2, + "output": 8.8 }, "type": "chat" }, { - "id": "gpt-image-test", - "name": "gpt-image-test", - "display_name": "gpt-image-test", + "id": "aihubmix-Llama-3-1-405B-Instruct", + "name": "aihubmix-Llama-3-1-405B-Instruct", + "display_name": "aihubmix-Llama-3-1-405B-Instruct", "limit": 
{ "context": 8192, "output": 8192 @@ -221697,108 +225884,68 @@ }, "cost": { "input": 5, - "output": 40, - "cache_read": 0 + "output": 15 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-non-reasoning", - "name": "grok-4.20-beta-0309-non-reasoning", - "display_name": "grok-4.20-beta-0309-non-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "aihubmix-Llama-3-1-70B-Instruct", + "name": "aihubmix-Llama-3-1-70B-Instruct", + "display_name": "aihubmix-Llama-3-1-70B-Instruct", "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0.6, + "output": 0.78 }, "type": "chat" }, { - "id": "grok-4.20-beta-0309-reasoning", - "name": "grok-4.20-beta-0309-reasoning", - "display_name": "grok-4.20-beta-0309-reasoning", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "aihubmix-Llama-3-1-8B-Instruct", + "name": "aihubmix-Llama-3-1-8B-Instruct", + "display_name": "aihubmix-Llama-3-1-8B-Instruct", "limit": { - "context": 2000000, - "output": 2000000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0.3, + "output": 0.6 }, "type": "chat" }, { - "id": "grok-4.20-multi-agent-beta-0309", - "name": "grok-4.20-multi-agent-beta-0309", - "display_name": "grok-4.20-multi-agent-beta-0309", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "aihubmix-Llama-3-2-11B-Vision", + "name": "aihubmix-Llama-3-2-11B-Vision", + "display_name": "aihubmix-Llama-3-2-11B-Vision", "limit": { - "context": 
2000000, - "output": 2000000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "cost": { - "input": 2, - "output": 6, - "cache_read": 0.2 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V2-Chat", - "name": "deepseek-ai/DeepSeek-V2-Chat", - "display_name": "deepseek-ai/DeepSeek-V2-Chat", + "id": "aihubmix-Llama-3-2-90B-Vision", + "name": "aihubmix-Llama-3-2-90B-Vision", + "display_name": "aihubmix-Llama-3-2-90B-Vision", "limit": { "context": 8192, "output": 8192 @@ -221808,15 +225955,15 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + "input": 2.4, + "output": 2.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-V2.5", - "name": "deepseek-ai/DeepSeek-V2.5", - "display_name": "deepseek-ai/DeepSeek-V2.5", + "id": "aihubmix-Llama-3-70B-Instruct", + "name": "aihubmix-Llama-3-70B-Instruct", + "display_name": "aihubmix-Llama-3-70B-Instruct", "limit": { "context": 8192, "output": 8192 @@ -221826,15 +225973,15 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + "input": 0.7, + "output": 0.7 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-llm-67b-chat", - "name": "deepseek-ai/deepseek-llm-67b-chat", - "display_name": "deepseek-ai/deepseek-llm-67b-chat", + "id": "aihubmix-Mistral-large", + "name": "aihubmix-Mistral-large", + "display_name": "aihubmix-Mistral-large", "limit": { "context": 8192, "output": 8192 @@ -221844,15 +225991,20 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 4, + "output": 12 }, "type": "chat" }, { - "id": "deepseek-ai/deepseek-vl2", - "name": "deepseek-ai/deepseek-vl2", - "display_name": "deepseek-ai/deepseek-vl2", + "id": "aihubmix-command-r-08-2024", + "name": "aihubmix-command-r-08-2024", + "display_name": "aihubmix-command-r-08-2024", + "modalities": { + 
"input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -221862,15 +226014,20 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.16 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "deepseek-v3", - "name": "deepseek-v3", - "display_name": "deepseek-v3", + "id": "aihubmix-command-r-plus", + "name": "aihubmix-command-r-plus", + "display_name": "aihubmix-command-r-plus", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -221880,19 +226037,18 @@ "supported": false }, "cost": { - "input": 0.272, - "output": 1.088, - "cache_read": 0 + "input": 3.84, + "output": 19.2 }, "type": "chat" }, { - "id": "distil-whisper-large-v3-en", - "name": "distil-whisper-large-v3-en", - "display_name": "distil-whisper-large-v3-en", + "id": "aihubmix-command-r-plus-08-2024", + "name": "aihubmix-command-r-plus-08-2024", + "display_name": "aihubmix-command-r-plus-08-2024", "modalities": { "input": [ - "audio" + "text" ] }, "limit": { @@ -221904,15 +226060,15 @@ "supported": false }, "cost": { - "input": 5.556, - "output": 5.556 + "input": 2.8, + "output": 11.2 }, "type": "chat" }, { - "id": "doubao-1-5-thinking-vision-pro-250428", - "name": "doubao-1-5-thinking-vision-pro-250428", - "display_name": "doubao-1-5-thinking-vision-pro-250428", + "id": "alicloud-deepseek-v3.2", + "name": "alicloud-deepseek-v3.2", + "display_name": "alicloud-deepseek-v3.2", "limit": { "context": 8192, "output": 8192 @@ -221922,16 +226078,16 @@ "supported": false }, "cost": { - "input": 2, - "output": 2, - "cache_read": 2 + "input": 0.274, + "output": 0.411, + "cache_read": 0.0548 }, "type": "chat" }, { - "id": "fx-flux-2-pro", - "name": "fx-flux-2-pro", - "display_name": "fx-flux-2-pro", + "id": "alicloud-glm-4.7", + "name": "alicloud-glm-4.7", + "display_name": "alicloud-glm-4.7", "limit": { "context": 8192, "output": 8192 @@ -221941,86 +226097,53 @@ "supported": false }, "cost": { - "input": 2, - "output": 0, - 
"cache_read": 0 + "input": 0.41096, + "output": 1.917786, + "cache_read": 0.41096 }, "type": "chat" }, { - "id": "gemini-2.5-pro-exp-03-25", - "name": "gemini-2.5-pro-exp-03-25", - "display_name": "gemini-2.5-pro-exp-03-25", - "modalities": { - "input": [ - "text", - "image", - "audio", - "video" - ] - }, + "id": "alicloud-kimi-k2-thinking", + "name": "alicloud-kimi-k2-thinking", + "display_name": "alicloud-kimi-k2-thinking", "limit": { "context": 8192, "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "default_enabled": true, - "mode": "budget", - "budget": { - "default": -1, - "min": 128, - "max": 32768, - "auto": -1, - "unit": "tokens" - }, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thought_signatures" - ] - } + "supported": false }, "cost": { - "input": 1.25, - "output": 5, - "cache_read": 0.125 + "input": 0.548, + "output": 2.192 }, "type": "chat" }, { - "id": "gemini-embedding-exp-03-07", - "name": "gemini-embedding-exp-03-07", - "display_name": "gemini-embedding-exp-03-07", - "modalities": { - "input": [ - "text" - ] - }, + "id": "alicloud-kimi-k2.5", + "name": "alicloud-kimi-k2.5", + "display_name": "alicloud-kimi-k2.5", "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 0.548, + "output": 2.877, + "cache_read": 0.0959 }, - "type": "embedding" + "type": "chat" }, { - "id": "gemini-exp-1114", - "name": "gemini-exp-1114", - "display_name": "gemini-exp-1114", + "id": "alicloud-minimax-m2.5", + "name": "alicloud-minimax-m2.5", + "display_name": "alicloud-minimax-m2.5", "limit": { "context": 8192, "output": 8192 @@ -222030,33 +226153,47 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 0.2876, + "output": 1.1504, + 
"cache_read": 0.05752 }, "type": "chat" }, { - "id": "gemini-exp-1121", - "name": "gemini-exp-1121", - "display_name": "gemini-exp-1121", + "id": "anthropic-opus-4-6", + "name": "anthropic-opus-4-6", + "display_name": "anthropic-opus-4-6", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "cost": { - "input": 1.25, - "output": 5 + "input": 5, + "output": 25, + "cache_read": 0.5 }, "type": "chat" }, { - "id": "gemini-pro", - "name": "gemini-pro", - "display_name": "gemini-pro", + "id": "azure-deepseek-v3.2", + "name": "azure-deepseek-v3.2", + "display_name": "azure-deepseek-v3.2", "limit": { "context": 8192, "output": 8192 @@ -222066,15 +226203,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.6 + "input": 0.58, + "output": 1.680028 }, "type": "chat" }, { - "id": "gemini-pro-vision", - "name": "gemini-pro-vision", - "display_name": "gemini-pro-vision", + "id": "azure-deepseek-v3.2-speciale", + "name": "azure-deepseek-v3.2-speciale", + "display_name": "azure-deepseek-v3.2-speciale", "limit": { "context": 8192, "output": 8192 @@ -222084,33 +226221,33 @@ "supported": false }, "cost": { - "input": 1, - "output": 1 + "input": 0.58, + "output": 1.680028 }, "type": "chat" }, { - "id": "gemma-7b-it", - "name": "gemma-7b-it", - "display_name": "gemma-7b-it", + "id": "azure-kimi-k2.5", + "name": "azure-kimi-k2.5", + "display_name": "azure-kimi-k2.5", "limit": { - "context": 8192, - "output": 8192 + "context": 256000, + "output": 256000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.6, + "output": 3 }, "type": "chat" }, { - "id": "glm-3-turbo", - "name": "glm-3-turbo", - "display_name": "glm-3-turbo", + 
"id": "cbs-glm-4.7", + "name": "cbs-glm-4.7", + "display_name": "cbs-glm-4.7", "limit": { "context": 8192, "output": 8192 @@ -222120,15 +226257,15 @@ "supported": false }, "cost": { - "input": 0.71, - "output": 0.71 + "input": 2.25, + "output": 2.749995 }, "type": "chat" }, { - "id": "glm-4", - "name": "glm-4", - "display_name": "glm-4", + "id": "cerebras-llama-3.3-70b", + "name": "cerebras-llama-3.3-70b", + "display_name": "cerebras-llama-3.3-70b", "limit": { "context": 8192, "output": 8192 @@ -222138,15 +226275,15 @@ "supported": false }, "cost": { - "input": 14.2, - "output": 14.2 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "glm-4-flash", - "name": "glm-4-flash", - "display_name": "glm-4-flash", + "id": "chatglm_lite", + "name": "chatglm_lite", + "display_name": "chatglm_lite", "limit": { "context": 8192, "output": 8192 @@ -222156,15 +226293,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.2858, + "output": 0.2858 }, "type": "chat" }, { - "id": "glm-4-plus", - "name": "glm-4-plus", - "display_name": "glm-4-plus", + "id": "chatglm_pro", + "name": "chatglm_pro", + "display_name": "chatglm_pro", "limit": { "context": 8192, "output": 8192 @@ -222174,20 +226311,15 @@ "supported": false }, "cost": { - "input": 8, - "output": 8 + "input": 1.4286, + "output": 1.4286 }, "type": "chat" }, { - "id": "glm-4.5-airx", - "name": "glm-4.5-airx", - "display_name": "glm-4.5-airx", - "modalities": { - "input": [ - "text" - ] - }, + "id": "chatglm_std", + "name": "chatglm_std", + "display_name": "chatglm_std", "limit": { "context": 8192, "output": 8192 @@ -222197,16 +226329,15 @@ "supported": false }, "cost": { - "input": 1.1, - "output": 4.51, - "cache_read": 0.22 + "input": 0.7144, + "output": 0.7144 }, "type": "chat" }, { - "id": "glm-4v", - "name": "glm-4v", - "display_name": "glm-4v", + "id": "chatglm_turbo", + "name": "chatglm_turbo", + "display_name": "chatglm_turbo", "limit": { "context": 8192, "output": 8192 @@ 
-222216,15 +226347,15 @@ "supported": false }, "cost": { - "input": 14.2, - "output": 14.2 + "input": 0.7144, + "output": 0.7144 }, "type": "chat" }, { - "id": "glm-4v-plus", - "name": "glm-4v-plus", - "display_name": "glm-4v-plus", + "id": "claude-2", + "name": "claude-2", + "display_name": "claude-2", "limit": { "context": 8192, "output": 8192 @@ -222234,15 +226365,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 8.8, + "output": 8.8 }, "type": "chat" }, { - "id": "google-gemma-3-12b-it", - "name": "google-gemma-3-12b-it", - "display_name": "google-gemma-3-12b-it", + "id": "claude-2.0", + "name": "claude-2.0", + "display_name": "claude-2.0", "limit": { "context": 8192, "output": 8192 @@ -222252,15 +226383,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 8.8, + "output": 39.6 }, "type": "chat" }, { - "id": "google-gemma-3-27b-it", - "name": "google-gemma-3-27b-it", - "display_name": "google-gemma-3-27b-it", + "id": "claude-2.1", + "name": "claude-2.1", + "display_name": "claude-2.1", "limit": { "context": 8192, "output": 8192 @@ -222270,35 +226401,45 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 8.8, + "output": 39.6 }, "type": "chat" }, { - "id": "google-gemma-3-4b-it", - "name": "google-gemma-3-4b-it", - "display_name": "google-gemma-3-4b-it", + "id": "claude-3-5-sonnet-20240620", + "name": "claude-3-5-sonnet-20240620", + "display_name": "claude-3-5-sonnet-20240620", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { - "context": 8192, - "output": 8192 + "context": 200000, + "output": 200000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.2, - "output": 0.2, - "cache_read": 0 + "input": 3.3, + "output": 16.5 }, "type": "chat" }, { - "id": "google/gemini-exp-1114", - "name": "google/gemini-exp-1114", - "display_name": "google/gemini-exp-1114", + "id": "claude-3-haiku-20240229", + "name": 
"claude-3-haiku-20240229", + "display_name": "claude-3-haiku-20240229", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222308,15 +226449,21 @@ "supported": false }, "cost": { - "input": 1.25, - "output": 5 + "input": 0.275, + "output": 0.275 }, "type": "chat" }, { - "id": "google/gemma-2-27b-it", - "name": "google/gemma-2-27b-it", - "display_name": "google/gemma-2-27b-it", + "id": "claude-3-haiku-20240307", + "name": "claude-3-haiku-20240307", + "display_name": "claude-3-haiku-20240307", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222326,15 +226473,21 @@ "supported": false }, "cost": { - "input": 0.8, - "output": 0.8 + "input": 0.275, + "output": 1.375 }, "type": "chat" }, { - "id": "google/gemma-2-9b-it:free", - "name": "google/gemma-2-9b-it:free", - "display_name": "google/gemma-2-9b-it:free", + "id": "claude-3-sonnet-20240229", + "name": "claude-3-sonnet-20240229", + "display_name": "claude-3-sonnet-20240229", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222344,15 +226497,15 @@ "supported": false }, "cost": { - "input": 0.02, - "output": 0.02 + "input": 3.3, + "output": 16.5 }, "type": "chat" }, { - "id": "gpt-3.5-turbo", - "name": "gpt-3.5-turbo", - "display_name": "gpt-3.5-turbo", + "id": "claude-instant-1", + "name": "claude-instant-1", + "display_name": "claude-instant-1", "limit": { "context": 8192, "output": 8192 @@ -222362,15 +226515,15 @@ "supported": false }, "cost": { - "input": 0.5, - "output": 1.5 + "input": 1.793, + "output": 1.793 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0301", - "name": "gpt-3.5-turbo-0301", - "display_name": "gpt-3.5-turbo-0301", + "id": "claude-instant-1.2", + "name": "claude-instant-1.2", + "display_name": "claude-instant-1.2", "limit": { "context": 8192, "output": 8192 @@ -222380,15 +226533,15 @@ "supported": false }, "cost": { - "input": 
1.5, - "output": 1.5 + "input": 0.88, + "output": 3.96 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-0613", - "name": "gpt-3.5-turbo-0613", - "display_name": "gpt-3.5-turbo-0613", + "id": "code-davinci-edit-001", + "name": "code-davinci-edit-001", + "display_name": "code-davinci-edit-001", "limit": { "context": 8192, "output": 8192 @@ -222398,15 +226551,15 @@ "supported": false }, "cost": { - "input": 1.5, - "output": 2 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-1106", - "name": "gpt-3.5-turbo-1106", - "display_name": "gpt-3.5-turbo-1106", + "id": "cogview-3", + "name": "cogview-3", + "display_name": "cogview-3", "limit": { "context": 8192, "output": 8192 @@ -222416,15 +226569,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 35.5, + "output": 35.5 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-16k", - "name": "gpt-3.5-turbo-16k", - "display_name": "gpt-3.5-turbo-16k", + "id": "cogview-3-plus", + "name": "cogview-3-plus", + "display_name": "cogview-3-plus", "limit": { "context": 8192, "output": 8192 @@ -222434,15 +226587,20 @@ "supported": false }, "cost": { - "input": 3, - "output": 4 + "input": 10, + "output": 10 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-16k-0613", - "name": "gpt-3.5-turbo-16k-0613", - "display_name": "gpt-3.5-turbo-16k-0613", + "id": "command", + "name": "command", + "display_name": "command", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222452,15 +226610,15 @@ "supported": false }, "cost": { - "input": 3, - "output": 4 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "gpt-3.5-turbo-instruct", - "name": "gpt-3.5-turbo-instruct", - "display_name": "gpt-3.5-turbo-instruct", + "id": "command-light", + "name": "command-light", + "display_name": "command-light", "limit": { "context": 8192, "output": 8192 @@ -222470,15 +226628,15 @@ "supported": false }, "cost": { - "input": 1.5, + "input": 1, "output": 2 }, "type": "chat" }, { - 
"id": "gpt-4", - "name": "gpt-4", - "display_name": "gpt-4", + "id": "command-light-nightly", + "name": "command-light-nightly", + "display_name": "command-light-nightly", "limit": { "context": 8192, "output": 8192 @@ -222488,15 +226646,15 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4-0125-preview", - "name": "gpt-4-0125-preview", - "display_name": "gpt-4-0125-preview", + "id": "command-nightly", + "name": "command-nightly", + "display_name": "command-nightly", "limit": { "context": 8192, "output": 8192 @@ -222506,15 +226664,20 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4-0314", - "name": "gpt-4-0314", - "display_name": "gpt-4-0314", + "id": "command-r", + "name": "command-r", + "display_name": "command-r", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222524,15 +226687,20 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 0.64, + "output": 1.92 }, "type": "chat" }, { - "id": "gpt-4-0613", - "name": "gpt-4-0613", - "display_name": "gpt-4-0613", + "id": "command-r-08-2024", + "name": "command-r-08-2024", + "display_name": "command-r-08-2024", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222542,15 +226710,20 @@ "supported": false }, "cost": { - "input": 30, - "output": 60 + "input": 0.2, + "output": 0.8 }, "type": "chat" }, { - "id": "gpt-4-1106-preview", - "name": "gpt-4-1106-preview", - "display_name": "gpt-4-1106-preview", + "id": "command-r-plus", + "name": "command-r-plus", + "display_name": "command-r-plus", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222560,15 +226733,20 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 3.84, + "output": 19.2 }, "type": "chat" }, { - "id": "gpt-4-32k-0314", - 
"name": "gpt-4-32k-0314", - "display_name": "gpt-4-32k-0314", + "id": "command-r-plus-08-2024", + "name": "command-r-plus-08-2024", + "display_name": "command-r-plus-08-2024", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222578,15 +226756,21 @@ "supported": false }, "cost": { - "input": 60, - "output": 120 + "input": 2.8, + "output": 11.2 }, "type": "chat" }, { - "id": "gpt-4-32k-0613", - "name": "gpt-4-32k-0613", - "display_name": "gpt-4-32k-0613", + "id": "dall-e-2", + "name": "dall-e-2", + "display_name": "dall-e-2", + "modalities": { + "input": [ + "text", + "image" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -222596,15 +226780,15 @@ "supported": false }, "cost": { - "input": 60, - "output": 120 + "input": 16, + "output": 16 }, - "type": "chat" + "type": "imageGeneration" }, { - "id": "gpt-4-turbo", - "name": "gpt-4-turbo", - "display_name": "gpt-4-turbo", + "id": "davinci", + "name": "davinci", + "display_name": "davinci", "limit": { "context": 8192, "output": 8192 @@ -222614,15 +226798,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 20, + "output": 20 }, "type": "chat" }, { - "id": "gpt-4-turbo-2024-04-09", - "name": "gpt-4-turbo-2024-04-09", - "display_name": "gpt-4-turbo-2024-04-09", + "id": "davinci-002", + "name": "davinci-002", + "display_name": "davinci-002", "limit": { "context": 8192, "output": 8192 @@ -222632,15 +226816,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "gpt-4-turbo-preview", - "name": "gpt-4-turbo-preview", - "display_name": "gpt-4-turbo-preview", + "id": "deepinfra-llama-3.1-8b-instant", + "name": "deepinfra-llama-3.1-8b-instant", + "display_name": "deepinfra-llama-3.1-8b-instant", "limit": { "context": 8192, "output": 8192 @@ -222650,15 +226834,15 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 0.033, + "output": 0.054978 }, "type": 
"chat" }, { - "id": "gpt-4-vision-preview", - "name": "gpt-4-vision-preview", - "display_name": "gpt-4-vision-preview", + "id": "deepinfra-llama-3.3-70b-instant-turbo", + "name": "deepinfra-llama-3.3-70b-instant-turbo", + "display_name": "deepinfra-llama-3.3-70b-instant-turbo", "limit": { "context": 8192, "output": 8192 @@ -222668,40 +226852,33 @@ "supported": false }, "cost": { - "input": 10, - "output": 30 + "input": 0.11, + "output": 0.352 }, "type": "chat" }, { - "id": "gpt-4o-2024-05-13", - "name": "gpt-4o-2024-05-13", - "display_name": "gpt-4o-2024-05-13", + "id": "deepinfra-llama-4-maverick-17b-128e-instruct", + "name": "deepinfra-llama-4-maverick-17b-128e-instruct", + "display_name": "deepinfra-llama-4-maverick-17b-128e-instruct", "limit": { - "context": 128000, - "output": 128000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 5, - "output": 15, - "cache_read": 5 + "input": 1.65, + "output": 6.6 }, "type": "chat" }, { - "id": "gpt-4o-mini-2024-07-18", - "name": "gpt-4o-mini-2024-07-18", - "display_name": "gpt-4o-mini-2024-07-18", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "deepinfra-llama-4-scout-17b-16e-instruct", + "name": "deepinfra-llama-4-scout-17b-16e-instruct", + "display_name": "deepinfra-llama-4-scout-17b-16e-instruct", "limit": { "context": 8192, "output": 8192 @@ -222711,75 +226888,57 @@ "supported": false }, "cost": { - "input": 0.15, - "output": 0.6, - "cache_read": 0.075 + "input": 0.088, + "output": 0.33, + "cache_read": 0 }, "type": "chat" }, { - "id": "gpt-oss-20b", - "name": "gpt-oss-20b", - "display_name": "gpt-oss-20b", - "modalities": { - "input": [ - "text" - ] - }, + "id": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "display_name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", "limit": { - "context": 128000, - "output": 128000 - }, - "tool_call": true, - "reasoning": { - "supported": true, - 
"default": true + "context": 8192, + "output": 8192 }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "tool_call": false, + "reasoning": { + "supported": false }, "cost": { - "input": 0.11, - "output": 0.55 + "input": 0.16, + "output": 0.32 }, "type": "chat" }, { - "id": "grok-2-vision-1212", - "name": "grok-2-vision-1212", - "display_name": "grok-2-vision-1212", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": false + "supported": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "cost": { - "input": 1.8, - "output": 9 + "input": 0.6, + "output": 0.6 }, "type": "chat" }, { - "id": "grok-vision-beta", - "name": "grok-vision-beta", - "display_name": "grok-vision-beta", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", "limit": { "context": 8192, "output": 8192 @@ -222789,15 +226948,15 @@ "supported": false }, "cost": { - "input": 5.6, - "output": 16.8 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "groq-llama-3.1-8b-instant", - "name": "groq-llama-3.1-8b-instant", - "display_name": "groq-llama-3.1-8b-instant", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", "limit": { "context": 8192, "output": 8192 @@ -222807,15 +226966,15 @@ "supported": false }, "cost": { - "input": 0.055, - "output": 0.088 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, { - "id": "groq-llama-3.3-70b-versatile", - "name": "groq-llama-3.3-70b-versatile", 
- "display_name": "groq-llama-3.3-70b-versatile", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", "limit": { "context": 8192, "output": 8192 @@ -222825,15 +226984,15 @@ "supported": false }, "cost": { - "input": 0.649, - "output": 0.869011 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "groq-llama-4-maverick-17b-128e-instruct", - "name": "groq-llama-4-maverick-17b-128e-instruct", - "display_name": "groq-llama-4-maverick-17b-128e-instruct", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", "limit": { "context": 8192, "output": 8192 @@ -222843,15 +227002,15 @@ "supported": false }, "cost": { - "input": 0.22, - "output": 0.66 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "groq-llama-4-scout-17b-16e-instruct", - "name": "groq-llama-4-scout-17b-16e-instruct", - "display_name": "groq-llama-4-scout-17b-16e-instruct", + "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", "limit": { "context": 8192, "output": 8192 @@ -222861,8 +227020,8 @@ "supported": false }, "cost": { - "input": 0.122, - "output": 0.366 + "input": 0.01, + "output": 0.01 }, "type": "chat" }, @@ -224356,226 +228515,9 @@ } }, { - "id": "tts-1-hd-1106", - "name": "tts-1-hd-1106", - "display_name": "tts-1-hd-1106", - "modalities": { - "input": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 30, - "output": 30 - } - }, - { - "id": "whisper-1", - "name": "whisper-1", - "display_name": "whisper-1", - "modalities": { - "input": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - 
"reasoning": { - "supported": false - }, - "cost": { - "input": 100, - "output": 100 - }, - "type": "chat" - }, - { - "id": "whisper-large-v3", - "name": "whisper-large-v3", - "display_name": "whisper-large-v3", - "modalities": { - "input": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 30.834, - "output": 30.834 - }, - "type": "chat" - }, - { - "id": "whisper-large-v3-turbo", - "name": "whisper-large-v3-turbo", - "display_name": "whisper-large-v3-turbo", - "modalities": { - "input": [ - "audio" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 5.556, - "output": 5.556 - }, - "type": "chat" - }, - { - "id": "yi-large", - "name": "yi-large", - "display_name": "yi-large", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 3, - "output": 3 - }, - "type": "chat" - }, - { - "id": "yi-large-rag", - "name": "yi-large-rag", - "display_name": "yi-large-rag", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 4, - "output": 4 - }, - "type": "chat" - }, - { - "id": "yi-large-turbo", - "name": "yi-large-turbo", - "display_name": "yi-large-turbo", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1.8, - "output": 1.8 - }, - "type": "chat" - }, - { - "id": "yi-lightning", - "name": "yi-lightning", - "display_name": "yi-lightning", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "yi-medium", - "name": "yi-medium", - "display_name": "yi-medium", - 
"limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" - }, - { - "id": "yi-vl-plus", - "name": "yi-vl-plus", - "display_name": "yi-vl-plus", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.000852, - "output": 0.000852 - }, - "type": "chat" - }, - { - "id": "Baichuan3-Turbo", - "name": "Baichuan3-Turbo", - "display_name": "Baichuan3-Turbo", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1.9, - "output": 1.9 - }, - "type": "chat" - }, - { - "id": "Baichuan3-Turbo-128k", - "name": "Baichuan3-Turbo-128k", - "display_name": "Baichuan3-Turbo-128k", + "id": "deepseek-ai/DeepSeek-V2-Chat", + "name": "deepseek-ai/DeepSeek-V2-Chat", + "display_name": "deepseek-ai/DeepSeek-V2-Chat", "limit": { "context": 8192, "output": 8192 @@ -224585,15 +228527,15 @@ "supported": false }, "cost": { - "input": 3.8, - "output": 3.8 + "input": 0.16, + "output": 0.32 }, "type": "chat" }, { - "id": "Baichuan4", - "name": "Baichuan4", - "display_name": "Baichuan4", + "id": "deepseek-ai/DeepSeek-V2.5", + "name": "deepseek-ai/DeepSeek-V2.5", + "display_name": "deepseek-ai/DeepSeek-V2.5", "limit": { "context": 8192, "output": 8192 @@ -224603,15 +228545,15 @@ "supported": false }, "cost": { - "input": 16, - "output": 16 + "input": 0.16, + "output": 0.32 }, "type": "chat" }, { - "id": "Baichuan4-Air", - "name": "Baichuan4-Air", - "display_name": "Baichuan4-Air", + "id": "deepseek-ai/deepseek-llm-67b-chat", + "name": "deepseek-ai/deepseek-llm-67b-chat", + "display_name": "deepseek-ai/deepseek-llm-67b-chat", "limit": { "context": 8192, "output": 8192 @@ -224627,477 +228569,9 @@ "type": "chat" }, { - "id": "Baichuan4-Turbo", - "name": "Baichuan4-Turbo", - "display_name": "Baichuan4-Turbo", 
- "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 2.4, - "output": 2.4 - }, - "type": "chat" - }, - { - "id": "DeepSeek-v3", - "name": "DeepSeek-v3", - "display_name": "DeepSeek-v3", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.272, - "output": 1.088 - }, - "type": "chat" - }, - { - "id": "Doubao-1.5-lite-32k", - "name": "Doubao-1.5-lite-32k", - "display_name": "Doubao-1.5-lite-32k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.05, - "output": 0.1, - "cache_read": 0.01 - }, - "type": "chat" - }, - { - "id": "Doubao-1.5-pro-256k", - "name": "Doubao-1.5-pro-256k", - "display_name": "Doubao-1.5-pro-256k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 1.44, - "cache_read": 0.8 - }, - "type": "chat" - }, - { - "id": "Doubao-1.5-pro-32k", - "name": "Doubao-1.5-pro-32k", - "display_name": "Doubao-1.5-pro-32k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.134, - "output": 0.335, - "cache_read": 0.0268 - }, - "type": "chat" - }, - { - "id": "Doubao-1.5-vision-pro-32k", - "name": "Doubao-1.5-vision-pro-32k", - "display_name": "Doubao-1.5-vision-pro-32k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.46, - "output": 1.38 - }, - "type": "chat" - }, - { - "id": "Doubao-lite-128k", - "name": "Doubao-lite-128k", - "display_name": "Doubao-lite-128k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 
0.14, - "output": 0.28, - "cache_read": 0.14 - }, - "type": "chat" - }, - { - "id": "Doubao-lite-32k", - "name": "Doubao-lite-32k", - "display_name": "Doubao-lite-32k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.06, - "output": 0.12, - "cache_read": 0.012 - }, - "type": "chat" - }, - { - "id": "Doubao-lite-4k", - "name": "Doubao-lite-4k", - "display_name": "Doubao-lite-4k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.06, - "output": 0.12, - "cache_read": 0.06 - }, - "type": "chat" - }, - { - "id": "Doubao-pro-128k", - "name": "Doubao-pro-128k", - "display_name": "Doubao-pro-128k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 1.44 - }, - "type": "chat" - }, - { - "id": "Doubao-pro-256k", - "name": "Doubao-pro-256k", - "display_name": "Doubao-pro-256k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 1.44, - "cache_read": 0.8 - }, - "type": "chat" - }, - { - "id": "Doubao-pro-32k", - "name": "Doubao-pro-32k", - "display_name": "Doubao-pro-32k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.14, - "output": 0.35, - "cache_read": 0.028 - }, - "type": "chat" - }, - { - "id": "Doubao-pro-4k", - "name": "Doubao-pro-4k", - "display_name": "Doubao-pro-4k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.14, - "output": 0.35 - }, - "type": "chat" - }, - { - "id": "GPT-OSS-20B", - "name": "GPT-OSS-20B", - "display_name": "GPT-OSS-20B", - "limit": { - "context": 8192, - 
"output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } - }, - "cost": { - "input": 0.11, - "output": 0.55 - }, - "type": "chat" - }, - { - "id": "Gryphe/MythoMax-L2-13b", - "name": "Gryphe/MythoMax-L2-13b", - "display_name": "Gryphe/MythoMax-L2-13b", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" - }, - { - "id": "MiniMax-Text-01", - "name": "MiniMax-Text-01", - "display_name": "MiniMax-Text-01", - "modalities": { - "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.14, - "output": 1.12 - }, - "type": "chat" - }, - { - "id": "Mistral-large-2407", - "name": "Mistral-large-2407", - "display_name": "Mistral-large-2407", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 3, - "output": 9 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2-1.5B-Instruct", - "name": "Qwen/Qwen2-1.5B-Instruct", - "display_name": "Qwen/Qwen2-1.5B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.2, - "output": 0.2 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2-57B-A14B-Instruct", - "name": "Qwen/Qwen2-57B-A14B-Instruct", - "display_name": "Qwen/Qwen2-57B-A14B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.24, - "output": 0.24 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2-72B-Instruct", - "name": "Qwen/Qwen2-72B-Instruct", - "display_name": "Qwen/Qwen2-72B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": 
false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 0.8 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2-7B-Instruct", - "name": "Qwen/Qwen2-7B-Instruct", - "display_name": "Qwen/Qwen2-7B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.08, - "output": 0.08 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-32B-Instruct", - "name": "Qwen/Qwen2.5-32B-Instruct", - "display_name": "Qwen/Qwen2.5-32B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.6, - "output": 0.6 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-72B-Instruct", - "name": "Qwen/Qwen2.5-72B-Instruct", - "display_name": "Qwen/Qwen2.5-72B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 0.8 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-72B-Instruct-128K", - "name": "Qwen/Qwen2.5-72B-Instruct-128K", - "display_name": "Qwen/Qwen2.5-72B-Instruct-128K", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.8, - "output": 0.8 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-7B-Instruct", - "name": "Qwen/Qwen2.5-7B-Instruct", - "display_name": "Qwen/Qwen2.5-7B-Instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 0.4 - }, - "type": "chat" - }, - { - "id": "Qwen/Qwen2.5-Coder-32B-Instruct", - "name": "Qwen/Qwen2.5-Coder-32B-Instruct", - "display_name": "Qwen/Qwen2.5-Coder-32B-Instruct", + "id": "deepseek-ai/deepseek-vl2", + "name": "deepseek-ai/deepseek-vl2", + "display_name": "deepseek-ai/deepseek-vl2", "limit": { "context": 
8192, "output": 8192 @@ -225113,44 +228587,9 @@ "type": "chat" }, { - "id": "Qwen3-235B-A22B-Thinking-2507", - "name": "Qwen3-235B-A22B-Thinking-2507", - "display_name": "Qwen3-235B-A22B-Thinking-2507", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "cost": { - "input": 0.28, - "output": 2.8 - }, - "type": "chat" - }, - { - "id": "Stable-Diffusion-3-5-Large", - "name": "Stable-Diffusion-3-5-Large", - "display_name": "Stable-Diffusion-3-5-Large", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "deepseek-v3", + "name": "deepseek-v3", + "display_name": "deepseek-v3", "limit": { "context": 8192, "output": 8192 @@ -225160,189 +228599,21 @@ "supported": false }, "cost": { - "input": 4, - "output": 4, + "input": 0.272, + "output": 1.088, "cache_read": 0 }, - "type": "imageGeneration" - }, - { - "id": "WizardLM/WizardCoder-Python-34B-V1.0", - "name": "WizardLM/WizardCoder-Python-34B-V1.0", - "display_name": "WizardLM/WizardCoder-Python-34B-V1.0", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.9, - "output": 0.9 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-5-MoE-instruct", - "name": "ahm-Phi-3-5-MoE-instruct", - "display_name": "ahm-Phi-3-5-MoE-instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-5-mini-instruct", - "name": "ahm-Phi-3-5-mini-instruct", - "display_name": "ahm-Phi-3-5-mini-instruct", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - 
"input": 1, - "output": 3 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-5-vision-instruct", - "name": "ahm-Phi-3-5-vision-instruct", - "display_name": "ahm-Phi-3-5-vision-instruct", - "modalities": { - "input": [ - "text", - "image" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 1.6 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-medium-128k", - "name": "ahm-Phi-3-medium-128k", - "display_name": "ahm-Phi-3-medium-128k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 6, - "output": 18 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-medium-4k", - "name": "ahm-Phi-3-medium-4k", - "display_name": "ahm-Phi-3-medium-4k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" - }, - { - "id": "ahm-Phi-3-small-128k", - "name": "ahm-Phi-3-small-128k", - "display_name": "ahm-Phi-3-small-128k", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 1, - "output": 3 - }, - "type": "chat" - }, - { - "id": "aihubmix-Codestral-2501", - "name": "aihubmix-Codestral-2501", - "display_name": "aihubmix-Codestral-2501", - "limit": { - "context": 8192, - "output": 8192 - }, - "tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.4, - "output": 1.2 - }, "type": "chat" }, { - "id": "aihubmix-Cohere-command-r", - "name": "aihubmix-Cohere-command-r", - "display_name": "aihubmix-Cohere-command-r", + "id": "distil-whisper-large-v3-en", + "name": "distil-whisper-large-v3-en", + "display_name": "distil-whisper-large-v3-en", "modalities": { "input": [ - "text" - ] - }, - "limit": { - "context": 8192, - "output": 8192 - }, - 
"tool_call": false, - "reasoning": { - "supported": false - }, - "cost": { - "input": 0.64, - "output": 1.92 - }, - "type": "chat" - }, - { - "id": "aihubmix-Jamba-1-5-Large", - "name": "aihubmix-Jamba-1-5-Large", - "display_name": "aihubmix-Jamba-1-5-Large", + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -225352,15 +228623,15 @@ "supported": false }, "cost": { - "input": 2.2, - "output": 8.8 + "input": 5.556, + "output": 5.556 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-405B-Instruct", - "name": "aihubmix-Llama-3-1-405B-Instruct", - "display_name": "aihubmix-Llama-3-1-405B-Instruct", + "id": "doubao-1-5-thinking-vision-pro-250428", + "name": "doubao-1-5-thinking-vision-pro-250428", + "display_name": "doubao-1-5-thinking-vision-pro-250428", "limit": { "context": 8192, "output": 8192 @@ -225370,15 +228641,16 @@ "supported": false }, "cost": { - "input": 5, - "output": 15 + "input": 2, + "output": 2, + "cache_read": 2 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-70B-Instruct", - "name": "aihubmix-Llama-3-1-70B-Instruct", - "display_name": "aihubmix-Llama-3-1-70B-Instruct", + "id": "fx-flux-2-pro", + "name": "fx-flux-2-pro", + "display_name": "fx-flux-2-pro", "limit": { "context": 8192, "output": 8192 @@ -225388,33 +228660,68 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.78 + "input": 2, + "output": 0, + "cache_read": 0 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-1-8B-Instruct", - "name": "aihubmix-Llama-3-1-8B-Instruct", - "display_name": "aihubmix-Llama-3-1-8B-Instruct", + "id": "gemini-2.5-pro-exp-03-25", + "name": "gemini-2.5-pro-exp-03-25", + "display_name": "gemini-2.5-pro-exp-03-25", + "modalities": { + "input": [ + "text", + "image", + "audio", + "video" + ] + }, "limit": { "context": 8192, "output": 8192 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + 
"default_enabled": true, + "mode": "budget", + "budget": { + "default": -1, + "min": 128, + "max": 32768, + "auto": -1, + "unit": "tokens" + }, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thought_signatures" + ] + } }, "cost": { - "input": 0.3, - "output": 0.6 + "input": 1.25, + "output": 5, + "cache_read": 0.125 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-2-11B-Vision", - "name": "aihubmix-Llama-3-2-11B-Vision", - "display_name": "aihubmix-Llama-3-2-11B-Vision", + "id": "gemini-embedding-exp-03-07", + "name": "gemini-embedding-exp-03-07", + "display_name": "gemini-embedding-exp-03-07", + "modalities": { + "input": [ + "text" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -225424,15 +228731,15 @@ "supported": false }, "cost": { - "input": 0.4, - "output": 0.4 + "input": 0.02, + "output": 0.02 }, - "type": "chat" + "type": "embedding" }, { - "id": "aihubmix-Llama-3-2-90B-Vision", - "name": "aihubmix-Llama-3-2-90B-Vision", - "display_name": "aihubmix-Llama-3-2-90B-Vision", + "id": "gemini-exp-1114", + "name": "gemini-exp-1114", + "display_name": "gemini-exp-1114", "limit": { "context": 8192, "output": 8192 @@ -225442,15 +228749,15 @@ "supported": false }, "cost": { - "input": 2.4, - "output": 2.4 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "aihubmix-Llama-3-70B-Instruct", - "name": "aihubmix-Llama-3-70B-Instruct", - "display_name": "aihubmix-Llama-3-70B-Instruct", + "id": "gemini-exp-1121", + "name": "gemini-exp-1121", + "display_name": "gemini-exp-1121", "limit": { "context": 8192, "output": 8192 @@ -225460,15 +228767,15 @@ "supported": false }, "cost": { - "input": 0.7, - "output": 0.7 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "aihubmix-Mistral-large", - "name": "aihubmix-Mistral-large", - "display_name": "aihubmix-Mistral-large", + "id": "gemini-pro", + "name": "gemini-pro", + "display_name": "gemini-pro", "limit": { "context": 8192, "output": 8192 @@ -225478,20 +228785,15 @@ 
"supported": false }, "cost": { - "input": 4, - "output": 12 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, { - "id": "aihubmix-command-r-08-2024", - "name": "aihubmix-command-r-08-2024", - "display_name": "aihubmix-command-r-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gemini-pro-vision", + "name": "gemini-pro-vision", + "display_name": "gemini-pro-vision", "limit": { "context": 8192, "output": 8192 @@ -225501,20 +228803,15 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.8 + "input": 1, + "output": 1 }, "type": "chat" }, { - "id": "aihubmix-command-r-plus", - "name": "aihubmix-command-r-plus", - "display_name": "aihubmix-command-r-plus", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gemma-7b-it", + "name": "gemma-7b-it", + "display_name": "gemma-7b-it", "limit": { "context": 8192, "output": 8192 @@ -225524,20 +228821,15 @@ "supported": false }, "cost": { - "input": 3.84, - "output": 19.2 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "aihubmix-command-r-plus-08-2024", - "name": "aihubmix-command-r-plus-08-2024", - "display_name": "aihubmix-command-r-plus-08-2024", - "modalities": { - "input": [ - "text" - ] - }, + "id": "glm-3-turbo", + "name": "glm-3-turbo", + "display_name": "glm-3-turbo", "limit": { "context": 8192, "output": 8192 @@ -225547,15 +228839,15 @@ "supported": false }, "cost": { - "input": 2.8, - "output": 11.2 + "input": 0.71, + "output": 0.71 }, "type": "chat" }, { - "id": "alicloud-deepseek-v3.2", - "name": "alicloud-deepseek-v3.2", - "display_name": "alicloud-deepseek-v3.2", + "id": "glm-4", + "name": "glm-4", + "display_name": "glm-4", "limit": { "context": 8192, "output": 8192 @@ -225565,16 +228857,15 @@ "supported": false }, "cost": { - "input": 0.274, - "output": 0.411, - "cache_read": 0.0548 + "input": 14.2, + "output": 14.2 }, "type": "chat" }, { - "id": "alicloud-glm-4.7", - "name": "alicloud-glm-4.7", - "display_name": "alicloud-glm-4.7", + "id": "glm-4-flash", + 
"name": "glm-4-flash", + "display_name": "glm-4-flash", "limit": { "context": 8192, "output": 8192 @@ -225584,16 +228875,15 @@ "supported": false }, "cost": { - "input": 0.41096, - "output": 1.917786, - "cache_read": 0.41096 + "input": 0.1, + "output": 0.1 }, "type": "chat" }, { - "id": "alicloud-kimi-k2-thinking", - "name": "alicloud-kimi-k2-thinking", - "display_name": "alicloud-kimi-k2-thinking", + "id": "glm-4-plus", + "name": "glm-4-plus", + "display_name": "glm-4-plus", "limit": { "context": 8192, "output": 8192 @@ -225603,34 +228893,39 @@ "supported": false }, "cost": { - "input": 0.548, - "output": 2.192 + "input": 8, + "output": 8 }, "type": "chat" }, { - "id": "alicloud-kimi-k2.5", - "name": "alicloud-kimi-k2.5", - "display_name": "alicloud-kimi-k2.5", + "id": "glm-4.5-airx", + "name": "glm-4.5-airx", + "display_name": "glm-4.5-airx", + "modalities": { + "input": [ + "text" + ] + }, "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.548, - "output": 2.877, - "cache_read": 0.0959 + "input": 1.1, + "output": 4.51, + "cache_read": 0.22 }, "type": "chat" }, { - "id": "alicloud-minimax-m2.5", - "name": "alicloud-minimax-m2.5", - "display_name": "alicloud-minimax-m2.5", + "id": "glm-4v", + "name": "glm-4v", + "display_name": "glm-4v", "limit": { "context": 8192, "output": 8192 @@ -225640,47 +228935,33 @@ "supported": false }, "cost": { - "input": 0.2876, - "output": 1.1504, - "cache_read": 0.05752 + "input": 14.2, + "output": 14.2 }, "type": "chat" }, { - "id": "anthropic-opus-4-6", - "name": "anthropic-opus-4-6", - "display_name": "anthropic-opus-4-6", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "glm-4v-plus", + "name": "glm-4v-plus", + "display_name": "glm-4v-plus", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, - "tool_call": true, + "tool_call": false, "reasoning": { - 
"supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "cost": { - "input": 5, - "output": 25, - "cache_read": 0.5 + "input": 2, + "output": 2 }, "type": "chat" }, { - "id": "azure-deepseek-v3.2", - "name": "azure-deepseek-v3.2", - "display_name": "azure-deepseek-v3.2", + "id": "google-gemma-3-12b-it", + "name": "google-gemma-3-12b-it", + "display_name": "google-gemma-3-12b-it", "limit": { "context": 8192, "output": 8192 @@ -225690,15 +228971,15 @@ "supported": false }, "cost": { - "input": 0.58, - "output": 1.680028 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "azure-deepseek-v3.2-speciale", - "name": "azure-deepseek-v3.2-speciale", - "display_name": "azure-deepseek-v3.2-speciale", + "id": "google-gemma-3-27b-it", + "name": "google-gemma-3-27b-it", + "display_name": "google-gemma-3-27b-it", "limit": { "context": 8192, "output": 8192 @@ -225708,33 +228989,35 @@ "supported": false }, "cost": { - "input": 0.58, - "output": 1.680028 + "input": 0.2, + "output": 0.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "azure-kimi-k2.5", - "name": "azure-kimi-k2.5", - "display_name": "azure-kimi-k2.5", + "id": "google-gemma-3-4b-it", + "name": "google-gemma-3-4b-it", + "display_name": "google-gemma-3-4b-it", "limit": { - "context": 256000, - "output": 256000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 0.6, - "output": 3 + "input": 0.2, + "output": 0.2, + "cache_read": 0 }, "type": "chat" }, { - "id": "cbs-glm-4.7", - "name": "cbs-glm-4.7", - "display_name": "cbs-glm-4.7", + "id": "google/gemini-exp-1114", + "name": "google/gemini-exp-1114", + "display_name": "google/gemini-exp-1114", "limit": { "context": 8192, "output": 8192 @@ -225744,15 +229027,15 @@ "supported": false }, "cost": { - "input": 2.25, - "output": 2.749995 + "input": 1.25, + "output": 5 }, "type": "chat" }, { - "id": "cerebras-llama-3.3-70b", 
- "name": "cerebras-llama-3.3-70b", - "display_name": "cerebras-llama-3.3-70b", + "id": "google/gemma-2-27b-it", + "name": "google/gemma-2-27b-it", + "display_name": "google/gemma-2-27b-it", "limit": { "context": 8192, "output": 8192 @@ -225762,15 +229045,15 @@ "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 0.8, + "output": 0.8 }, "type": "chat" }, { - "id": "chatglm_lite", - "name": "chatglm_lite", - "display_name": "chatglm_lite", + "id": "google/gemma-2-9b-it:free", + "name": "google/gemma-2-9b-it:free", + "display_name": "google/gemma-2-9b-it:free", "limit": { "context": 8192, "output": 8192 @@ -225780,15 +229063,15 @@ "supported": false }, "cost": { - "input": 0.2858, - "output": 0.2858 + "input": 0.02, + "output": 0.02 }, "type": "chat" }, { - "id": "chatglm_pro", - "name": "chatglm_pro", - "display_name": "chatglm_pro", + "id": "gpt-3.5-turbo", + "name": "gpt-3.5-turbo", + "display_name": "gpt-3.5-turbo", "limit": { "context": 8192, "output": 8192 @@ -225798,15 +229081,15 @@ "supported": false }, "cost": { - "input": 1.4286, - "output": 1.4286 + "input": 0.5, + "output": 1.5 }, "type": "chat" }, { - "id": "chatglm_std", - "name": "chatglm_std", - "display_name": "chatglm_std", + "id": "gpt-3.5-turbo-0301", + "name": "gpt-3.5-turbo-0301", + "display_name": "gpt-3.5-turbo-0301", "limit": { "context": 8192, "output": 8192 @@ -225816,15 +229099,15 @@ "supported": false }, "cost": { - "input": 0.7144, - "output": 0.7144 + "input": 1.5, + "output": 1.5 }, "type": "chat" }, { - "id": "chatglm_turbo", - "name": "chatglm_turbo", - "display_name": "chatglm_turbo", + "id": "gpt-3.5-turbo-0613", + "name": "gpt-3.5-turbo-0613", + "display_name": "gpt-3.5-turbo-0613", "limit": { "context": 8192, "output": 8192 @@ -225834,15 +229117,15 @@ "supported": false }, "cost": { - "input": 0.7144, - "output": 0.7144 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "claude-2", - "name": "claude-2", - "display_name": "claude-2", + "id": 
"gpt-3.5-turbo-1106", + "name": "gpt-3.5-turbo-1106", + "display_name": "gpt-3.5-turbo-1106", "limit": { "context": 8192, "output": 8192 @@ -225852,15 +229135,15 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 8.8 + "input": 1, + "output": 2 }, "type": "chat" }, { - "id": "claude-2.0", - "name": "claude-2.0", - "display_name": "claude-2.0", + "id": "gpt-3.5-turbo-16k", + "name": "gpt-3.5-turbo-16k", + "display_name": "gpt-3.5-turbo-16k", "limit": { "context": 8192, "output": 8192 @@ -225870,15 +229153,15 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 39.6 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "claude-2.1", - "name": "claude-2.1", - "display_name": "claude-2.1", + "id": "gpt-3.5-turbo-16k-0613", + "name": "gpt-3.5-turbo-16k-0613", + "display_name": "gpt-3.5-turbo-16k-0613", "limit": { "context": 8192, "output": 8192 @@ -225888,45 +229171,33 @@ "supported": false }, "cost": { - "input": 8.8, - "output": 39.6 + "input": 3, + "output": 4 }, "type": "chat" }, { - "id": "claude-3-5-sonnet-20240620", - "name": "claude-3-5-sonnet-20240620", - "display_name": "claude-3-5-sonnet-20240620", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "gpt-3.5-turbo-instruct", + "name": "gpt-3.5-turbo-instruct", + "display_name": "gpt-3.5-turbo-instruct", "limit": { - "context": 200000, - "output": 200000 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 1.5, + "output": 2 }, "type": "chat" }, { - "id": "claude-3-haiku-20240229", - "name": "claude-3-haiku-20240229", - "display_name": "claude-3-haiku-20240229", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "gpt-4", + "name": "gpt-4", + "display_name": "gpt-4", "limit": { "context": 8192, "output": 8192 @@ -225936,21 +229207,15 @@ "supported": false }, "cost": { - "input": 0.275, - "output": 0.275 + "input": 30, + "output": 60 }, "type": "chat" }, { - 
"id": "claude-3-haiku-20240307", - "name": "claude-3-haiku-20240307", - "display_name": "claude-3-haiku-20240307", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "gpt-4-0125-preview", + "name": "gpt-4-0125-preview", + "display_name": "gpt-4-0125-preview", "limit": { "context": 8192, "output": 8192 @@ -225960,21 +229225,15 @@ "supported": false }, "cost": { - "input": 0.275, - "output": 1.375 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "claude-3-sonnet-20240229", - "name": "claude-3-sonnet-20240229", - "display_name": "claude-3-sonnet-20240229", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "gpt-4-0314", + "name": "gpt-4-0314", + "display_name": "gpt-4-0314", "limit": { "context": 8192, "output": 8192 @@ -225984,15 +229243,15 @@ "supported": false }, "cost": { - "input": 3.3, - "output": 16.5 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "claude-instant-1", - "name": "claude-instant-1", - "display_name": "claude-instant-1", + "id": "gpt-4-0613", + "name": "gpt-4-0613", + "display_name": "gpt-4-0613", "limit": { "context": 8192, "output": 8192 @@ -226002,15 +229261,15 @@ "supported": false }, "cost": { - "input": 1.793, - "output": 1.793 + "input": 30, + "output": 60 }, "type": "chat" }, { - "id": "claude-instant-1.2", - "name": "claude-instant-1.2", - "display_name": "claude-instant-1.2", + "id": "gpt-4-1106-preview", + "name": "gpt-4-1106-preview", + "display_name": "gpt-4-1106-preview", "limit": { "context": 8192, "output": 8192 @@ -226020,15 +229279,15 @@ "supported": false }, "cost": { - "input": 0.88, - "output": 3.96 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "code-davinci-edit-001", - "name": "code-davinci-edit-001", - "display_name": "code-davinci-edit-001", + "id": "gpt-4-32k-0314", + "name": "gpt-4-32k-0314", + "display_name": "gpt-4-32k-0314", "limit": { "context": 8192, "output": 8192 @@ -226038,15 +229297,15 @@ "supported": false }, "cost": { - "input": 20, - 
"output": 20 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "cogview-3", - "name": "cogview-3", - "display_name": "cogview-3", + "id": "gpt-4-32k-0613", + "name": "gpt-4-32k-0613", + "display_name": "gpt-4-32k-0613", "limit": { "context": 8192, "output": 8192 @@ -226056,15 +229315,15 @@ "supported": false }, "cost": { - "input": 35.5, - "output": 35.5 + "input": 60, + "output": 120 }, "type": "chat" }, { - "id": "cogview-3-plus", - "name": "cogview-3-plus", - "display_name": "cogview-3-plus", + "id": "gpt-4-turbo", + "name": "gpt-4-turbo", + "display_name": "gpt-4-turbo", "limit": { "context": 8192, "output": 8192 @@ -226075,19 +229334,14 @@ }, "cost": { "input": 10, - "output": 10 + "output": 30 }, "type": "chat" }, { - "id": "command", - "name": "command", - "display_name": "command", - "modalities": { - "input": [ - "text" - ] - }, + "id": "gpt-4-turbo-2024-04-09", + "name": "gpt-4-turbo-2024-04-09", + "display_name": "gpt-4-turbo-2024-04-09", "limit": { "context": 8192, "output": 8192 @@ -226097,15 +229351,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "command-light", - "name": "command-light", - "display_name": "command-light", + "id": "gpt-4-turbo-preview", + "name": "gpt-4-turbo-preview", + "display_name": "gpt-4-turbo-preview", "limit": { "context": 8192, "output": 8192 @@ -226115,15 +229369,15 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "command-light-nightly", - "name": "command-light-nightly", - "display_name": "command-light-nightly", + "id": "gpt-4-vision-preview", + "name": "gpt-4-vision-preview", + "display_name": "gpt-4-vision-preview", "limit": { "context": 8192, "output": 8192 @@ -226133,36 +229387,38 @@ "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 10, + "output": 30 }, "type": "chat" }, { - "id": "command-nightly", - "name": "command-nightly", - 
"display_name": "command-nightly", + "id": "gpt-4o-2024-05-13", + "name": "gpt-4o-2024-05-13", + "display_name": "gpt-4o-2024-05-13", "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { "supported": false }, "cost": { - "input": 1, - "output": 2 + "input": 5, + "output": 15, + "cache_read": 5 }, "type": "chat" }, { - "id": "command-r", - "name": "command-r", - "display_name": "command-r", + "id": "gpt-4o-mini-2024-07-18", + "name": "gpt-4o-mini-2024-07-18", + "display_name": "gpt-4o-mini-2024-07-18", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -226174,41 +229430,49 @@ "supported": false }, "cost": { - "input": 0.64, - "output": 1.92 + "input": 0.15, + "output": 0.6, + "cache_read": 0.075 }, "type": "chat" }, { - "id": "command-r-08-2024", - "name": "command-r-08-2024", - "display_name": "command-r-08-2024", + "id": "gpt-oss-20b", + "name": "gpt-oss-20b", + "display_name": "gpt-oss-20b", "modalities": { "input": [ "text" ] }, "limit": { - "context": 8192, - "output": 8192 + "context": 128000, + "output": 128000 }, - "tool_call": false, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true + } }, "cost": { - "input": 0.2, - "output": 0.8 + "input": 0.11, + "output": 0.55 }, "type": "chat" }, { - "id": "command-r-plus", - "name": "command-r-plus", - "display_name": "command-r-plus", + "id": "grok-2-vision-1212", + "name": "grok-2-vision-1212", + "display_name": "grok-2-vision-1212", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -226220,18 +229484,19 @@ "supported": false }, "cost": { - "input": 3.84, - "output": 19.2 + "input": 1.8, + "output": 9 }, "type": "chat" }, { - "id": "command-r-plus-08-2024", - "name": "command-r-plus-08-2024", - "display_name": "command-r-plus-08-2024", + "id": "grok-vision-beta", + "name": 
"grok-vision-beta", + "display_name": "grok-vision-beta", "modalities": { "input": [ - "text" + "text", + "image" ] }, "limit": { @@ -226243,21 +229508,15 @@ "supported": false }, "cost": { - "input": 2.8, - "output": 11.2 + "input": 5.6, + "output": 16.8 }, "type": "chat" }, { - "id": "dall-e-2", - "name": "dall-e-2", - "display_name": "dall-e-2", - "modalities": { - "input": [ - "text", - "image" - ] - }, + "id": "groq-llama-3.1-8b-instant", + "name": "groq-llama-3.1-8b-instant", + "display_name": "groq-llama-3.1-8b-instant", "limit": { "context": 8192, "output": 8192 @@ -226267,15 +229526,15 @@ "supported": false }, "cost": { - "input": 16, - "output": 16 + "input": 0.055, + "output": 0.088 }, - "type": "imageGeneration" + "type": "chat" }, { - "id": "davinci", - "name": "davinci", - "display_name": "davinci", + "id": "groq-llama-3.3-70b-versatile", + "name": "groq-llama-3.3-70b-versatile", + "display_name": "groq-llama-3.3-70b-versatile", "limit": { "context": 8192, "output": 8192 @@ -226285,15 +229544,15 @@ "supported": false }, "cost": { - "input": 20, - "output": 20 + "input": 0.649, + "output": 0.869011 }, "type": "chat" }, { - "id": "davinci-002", - "name": "davinci-002", - "display_name": "davinci-002", + "id": "groq-llama-4-maverick-17b-128e-instruct", + "name": "groq-llama-4-maverick-17b-128e-instruct", + "display_name": "groq-llama-4-maverick-17b-128e-instruct", "limit": { "context": 8192, "output": 8192 @@ -226303,15 +229562,15 @@ "supported": false }, "cost": { - "input": 2, - "output": 2 + "input": 0.22, + "output": 0.66 }, "type": "chat" }, { - "id": "deepinfra-llama-3.1-8b-instant", - "name": "deepinfra-llama-3.1-8b-instant", - "display_name": "deepinfra-llama-3.1-8b-instant", + "id": "groq-llama-4-scout-17b-16e-instruct", + "name": "groq-llama-4-scout-17b-16e-instruct", + "display_name": "groq-llama-4-scout-17b-16e-instruct", "limit": { "context": 8192, "output": 8192 @@ -226321,15 +229580,20 @@ "supported": false }, "cost": { - "input": 0.033, - 
"output": 0.054978 + "input": 0.122, + "output": 0.366 }, "type": "chat" }, { - "id": "deepinfra-llama-3.3-70b-instant-turbo", - "name": "deepinfra-llama-3.3-70b-instant-turbo", - "display_name": "deepinfra-llama-3.3-70b-instant-turbo", + "id": "whisper-1", + "name": "whisper-1", + "display_name": "whisper-1", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -226339,15 +229603,20 @@ "supported": false }, "cost": { - "input": 0.11, - "output": 0.352 + "input": 100, + "output": 100 }, "type": "chat" }, { - "id": "deepinfra-llama-4-maverick-17b-128e-instruct", - "name": "deepinfra-llama-4-maverick-17b-128e-instruct", - "display_name": "deepinfra-llama-4-maverick-17b-128e-instruct", + "id": "whisper-large-v3", + "name": "whisper-large-v3", + "display_name": "whisper-large-v3", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -226357,15 +229626,20 @@ "supported": false }, "cost": { - "input": 1.65, - "output": 6.6 + "input": 30.834, + "output": 30.834 }, "type": "chat" }, { - "id": "deepinfra-llama-4-scout-17b-16e-instruct", - "name": "deepinfra-llama-4-scout-17b-16e-instruct", - "display_name": "deepinfra-llama-4-scout-17b-16e-instruct", + "id": "whisper-large-v3-turbo", + "name": "whisper-large-v3-turbo", + "display_name": "whisper-large-v3-turbo", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -226375,16 +229649,15 @@ "supported": false }, "cost": { - "input": 0.088, - "output": 0.33, - "cache_read": 0 + "input": 5.556, + "output": 5.556 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-Coder-V2-Instruct", - "name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", - "display_name": "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "id": "yi-large", + "name": "yi-large", + "display_name": "yi-large", "limit": { "context": 8192, "output": 8192 @@ -226394,38 +229667,33 @@ "supported": false }, "cost": { - "input": 0.16, - "output": 0.32 + 
"input": 3, + "output": 3 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "id": "yi-large-rag", + "name": "yi-large-rag", + "display_name": "yi-large-rag", "limit": { "context": 8192, "output": 8192 }, "tool_call": false, "reasoning": { - "supported": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true - } + "supported": false }, "cost": { - "input": 0.6, - "output": 0.6 + "input": 4, + "output": 4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "id": "yi-large-turbo", + "name": "yi-large-turbo", + "display_name": "yi-large-turbo", "limit": { "context": 8192, "output": 8192 @@ -226435,15 +229703,15 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 + "input": 1.8, + "output": 1.8 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B", + "id": "yi-lightning", + "name": "yi-lightning", + "display_name": "yi-lightning", "limit": { "context": 8192, "output": 8192 @@ -226453,15 +229721,15 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 + "input": 0.2, + "output": 0.2 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "id": "yi-medium", + "name": "yi-medium", + "display_name": "yi-medium", "limit": { "context": 8192, "output": 8192 @@ -226471,15 +229739,15 @@ "supported": false }, "cost": { - "input": 0.1, - "output": 0.1 + "input": 0.4, + "output": 0.4 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "name": 
"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "id": "yi-vl-plus", + "name": "yi-vl-plus", + "display_name": "yi-vl-plus", "limit": { "context": 8192, "output": 8192 @@ -226489,15 +229757,20 @@ "supported": false }, "cost": { - "input": 0.2, - "output": 0.2 + "input": 0.000852, + "output": 0.000852 }, "type": "chat" }, { - "id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", - "display_name": "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "id": "tts-1-hd-1106", + "name": "tts-1-hd-1106", + "display_name": "tts-1-hd-1106", + "modalities": { + "input": [ + "audio" + ] + }, "limit": { "context": 8192, "output": 8192 @@ -226507,10 +229780,9 @@ "supported": false }, "cost": { - "input": 0.01, - "output": 0.01 - }, - "type": "chat" + "input": 30, + "output": 30 + } }, { "id": "aistudio_gpt-4.1-mini", @@ -228342,8 +231614,8 @@ ] }, "limit": { - "context": 131072, - "output": 16384 + "context": 8192, + "output": 8192 }, "tool_call": false, "reasoning": { @@ -228469,8 +231741,8 @@ ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1048575, + "output": 1048575 }, "tool_call": true, "reasoning": { @@ -229343,8 +232615,8 @@ ] }, "limit": { - "context": 256000, - "output": 8192 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -230288,7 +233560,7 @@ ] }, "limit": { - "context": 204800, + "context": 196608, "output": 131072 }, "temperature": true, @@ -230891,8 +234163,8 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -230926,8 +234198,8 @@ ] }, "limit": { - "context": 262142, - "output": 262142 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { @@ -230941,30 +234213,6 @@ }, "type": "imageGeneration" }, - { - "id": "moonshotai/kimi-k2.6:free", - "name": "MoonshotAI: Kimi K2.6 (free)", - "display_name": 
"MoonshotAI: Kimi K2.6 (free)", - "modalities": { - "input": [ - "text", - "image" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 262144, - "output": 262144 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "imageGeneration" - }, { "id": "morph/morph-v3-fast", "name": "Morph: Morph V3 Fast", @@ -231388,29 +234636,6 @@ }, "type": "imageGeneration" }, - { - "id": "nvidia/nemotron-nano-9b-v2", - "name": "NVIDIA: Nemotron Nano 9B V2", - "display_name": "NVIDIA: Nemotron Nano 9B V2", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 131072, - "output": 16384 - }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "type": "chat" - }, { "id": "nvidia/nemotron-nano-9b-v2:free", "name": "NVIDIA: Nemotron Nano 9B V2 (free)", @@ -234052,8 +237277,8 @@ ] }, "limit": { - "context": 32000, - "output": 32000 + "context": 128000, + "output": 128000 }, "tool_call": false, "reasoning": { @@ -235170,8 +238395,8 @@ ] }, "limit": { - "context": 262140, - "output": 262140 + "context": 262144, + "output": 262144 }, "temperature": true, "tool_call": true, @@ -241166,7 +244391,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -241183,6 +244409,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-07-31", "release_date": "2024-10-22", "last_updated": "2024-10-22", "cost": { @@ -241211,7 +244438,7 @@ "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -241262,8 +244489,9 @@ "display_name": "Anthropic: Claude Haiku 4.5", "modalities": { "input": [ + "text", "image", - "text" + "pdf" ], "output": [ "text" @@ -241302,6 +244530,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-02-28", "release_date": "2025-10-15", "last_updated": "2025-10-15", "cost": { @@ -241318,9 +244547,9 
@@ "display_name": "Anthropic: Claude Opus 4", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -241359,8 +244588,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-03-31", "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "last_updated": "2025-05-22", "cost": { "input": 15, "output": 75, @@ -241375,9 +244605,9 @@ "display_name": "Anthropic: Claude Opus 4.1", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -241416,8 +244646,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-03-31", "release_date": "2025-08-05", - "last_updated": "2026-03-15", + "last_updated": "2025-08-05", "cost": { "input": 15, "output": 75, @@ -241432,9 +244663,9 @@ "display_name": "Anthropic: Claude Opus 4.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -241479,8 +244710,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-11-24", - "last_updated": "2026-03-15", + "knowledge": "2025-03-31", + "release_date": "2024-11-24", + "last_updated": "2025-11-24", "cost": { "input": 5, "output": 25, @@ -241507,6 +244739,7 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -241542,11 +244775,14 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-05-31", "release_date": "2026-02-05", - "last_updated": "2026-02-05", + "last_updated": "2026-03-13", "cost": { - "input": 4.998, - "output": 25.007 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, @@ -241568,6 +244804,7 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -241601,12 +244838,14 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2026-01-31", "release_date": "2026-04-16", "last_updated": "2026-04-16", "cost": { - 
"input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, @@ -241628,6 +244867,7 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -241664,9 +244904,10 @@ "release_date": "2026-05-28", "last_updated": "2026-05-28", "cost": { - "input": 4.998, - "output": 25.007, - "cache_read": 0.4998 + "input": 5, + "output": 25, + "cache_read": 0.5, + "cache_write": 6.25 }, "type": "chat" }, @@ -241676,9 +244917,9 @@ "display_name": "Anthropic: Claude Sonnet 4", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -241717,8 +244958,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-03-31", "release_date": "2025-05-22", - "last_updated": "2026-03-15", + "last_updated": "2025-05-22", "cost": { "input": 3, "output": 15, @@ -241733,16 +244975,16 @@ "display_name": "Anthropic: Claude Sonnet 4.5", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1000000, + "context": 200000, "output": 64000 }, "temperature": true, @@ -241774,8 +245016,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-07-31", "release_date": "2025-09-29", - "last_updated": "2026-03-15", + "last_updated": "2025-09-29", "cost": { "input": 3, "output": 15, @@ -241802,6 +245045,7 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -241839,10 +245083,12 @@ "open_weights": false, "knowledge": "2025-08-31", "release_date": "2026-02-17", - "last_updated": "2026-02-17", + "last_updated": "2026-03-13", "cost": { - "input": 2.992, - "output": 14.993999999999998 + "input": 3, + "output": 15, + "cache_read": 0.3, + "cache_write": 3.75 }, "type": "chat" }, @@ -242210,23 +245456,14 @@ ] }, "limit": { - "context": 32768, - "output": 7168 + 
"context": 131072, + "output": 32768 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-08-21", - "last_updated": "2025-08-21", - "cost": { - "input": 0.15, - "output": 0.75 - }, "type": "chat" }, { @@ -242236,6 +245473,7 @@ "modalities": { "input": [ "text", + "image", "pdf" ], "output": [ @@ -242243,10 +245481,11 @@ ] }, "limit": { - "context": 163000, - "output": 65536 + "context": 128000, + "output": 8000 }, - "tool_call": true, + "temperature": true, + "tool_call": false, "reasoning": { "supported": true }, @@ -242255,13 +245494,15 @@ "supported": true } }, - "attachment": true, + "attachment": false, "open_weights": false, + "knowledge": "2024-07", "release_date": "2025-12-01", "last_updated": "2025-12-01", "cost": { - "input": 0.27999999999999997, - "output": 0.42000000000000004 + "input": 0.28, + "output": 0.42, + "cache_read": 0.028 }, "type": "chat" }, @@ -242271,16 +245512,19 @@ "display_name": "DeepSeek: DeepSeek V4 Flash", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 384000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -242298,13 +245542,14 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-24", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-23", "last_updated": "2026-04-24", "cost": { "input": 0.14, "output": 0.28, - "cache_read": 0.028 + "cache_read": 0.0028 }, "type": "chat" }, @@ -242314,16 +245559,18 @@ "display_name": "DeepSeek: DeepSeek V4 Pro", "modalities": { "input": [ - "text" + "text", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, + "context": 1000000, "output": 384000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -242341,13 +245588,14 @@ } }, "attachment": false, 
- "open_weights": false, - "release_date": "2026-04-24", + "open_weights": true, + "knowledge": "2025-05", + "release_date": "2026-04-23", "last_updated": "2026-04-24", "cost": { - "input": 1.1, - "output": 2.2, - "cache_read": 0.11 + "input": 0.435, + "output": 0.87, + "cache_read": 0.0036 }, "type": "chat" }, @@ -242364,23 +245612,19 @@ ] }, "limit": { - "context": 163840, - "output": 163840 + "context": 1000000, + "output": 384000 }, "temperature": true, "tool_call": true, "reasoning": { "supported": false }, - "attachment": false, + "attachment": true, "open_weights": true, - "release_date": "2024-12-01", - "last_updated": "2026-03-15", - "cost": { - "input": 0.32, - "output": 0.89, - "cache_read": 0.15 - }, + "knowledge": "2025-09", + "release_date": "2025-12-01", + "last_updated": "2026-02-28", "type": "chat" }, { @@ -242441,23 +245685,18 @@ ] }, "limit": { - "context": 163840, - "output": 65536 + "context": 128000, + "output": 32000 }, "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": false }, "attachment": false, - "open_weights": true, + "open_weights": false, "release_date": "2025-09-29", "last_updated": "2025-09-29", - "cost": { - "input": 0.27, - "output": 0.41 - }, "type": "chat" }, { @@ -242466,11 +245705,11 @@ "display_name": "Google: Gemini 2.5 Flash", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -242478,7 +245717,7 @@ }, "limit": { "context": 1048576, - "output": 65535 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -242508,13 +245747,14 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-07-17", - "last_updated": "2026-03-15", + "knowledge": "2025-01", + "release_date": "2025-06-17", + "last_updated": "2025-06-17", "cost": { "input": 0.3, "output": 2.5, - "cache_read": 0.03, - "cache_write": 0.083333 + "cache_read": 0.075, + "cache_write": 0.55 }, "type": 
"chat" }, @@ -242524,11 +245764,9 @@ "display_name": "Google: Gemini 2.5 Flash Lite", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" @@ -242536,7 +245774,7 @@ }, "limit": { "context": 1048576, - "output": 65535 + "output": 65536 }, "temperature": true, "tool_call": true, @@ -242565,13 +245803,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2025-06-17", - "last_updated": "2026-03-15", + "last_updated": "2025-06-17", "cost": { "input": 0.1, "output": 0.4, - "cache_read": 0.01, - "cache_write": 0.083333 + "cache_read": 0.01 }, "type": "chat" }, @@ -242581,11 +245819,11 @@ "display_name": "Google: Gemini 2.5 Pro", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" @@ -242622,13 +245860,14 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2025-03-20", - "last_updated": "2026-03-15", + "last_updated": "2025-06-05", "cost": { "input": 1.25, "output": 10, - "cache_read": 0.125, - "cache_write": 0.375 + "cache_read": 0.31, + "cache_write": 2.375 }, "type": "chat" }, @@ -242639,16 +245878,20 @@ "modalities": { "input": [ "text", - "image" + "image", + "audio", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, + "context": 1048576, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -242675,11 +245918,14 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2025-12-17", "last_updated": "2025-12-17", "cost": { "input": 0.5, - "output": 3 + "output": 3, + "cache_read": 0.05, + "cache_write": 1 }, "type": "chat" }, @@ -242698,9 +245944,10 @@ ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 65000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ 
-242713,12 +245960,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-03-03", - "last_updated": "2026-03-03", + "knowledge": "2025-01", + "release_date": "2026-05-07", + "last_updated": "2026-05-07", "cost": { "input": 0.25, "output": 1.5, - "cache_read": 0.025 + "cache_read": 0.03 }, "type": "chat" }, @@ -242728,19 +245976,17 @@ "display_name": "Google: Gemini 3.1 Flash Lite Preview", "modalities": { "input": [ - "audio", - "image", - "pdf", "text", - "video" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 65000 }, "temperature": true, "tool_call": true, @@ -242755,11 +246001,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2026-03-03", - "last_updated": "2026-03-15", + "last_updated": "2026-03-03", "cost": { "input": 0.25, - "output": 1.5 + "output": 1.5, + "cache_read": 0.03 }, "type": "chat" }, @@ -242770,16 +246018,18 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048756, - "output": 65536 + "context": 1000000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -242804,7 +246054,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-19", + "knowledge": "2025-01", + "release_date": "2025-11-18", "last_updated": "2026-02-19", "cost": { "input": 2, @@ -242821,16 +246072,17 @@ "input": [ "text", "image", - "audio" + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 65536 + "context": 1000000, + "output": 64000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -242857,6 +246109,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-01", "release_date": "2026-05-19", "last_updated": "2026-05-19", "cost": { @@ -242912,12 +246165,23 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 
131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-09", + "last_updated": "2025-10-09", + "cost": { + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 + }, "type": "chat" }, { @@ -242936,18 +246200,18 @@ "context": 262144, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, + "open_weights": true, "release_date": "2026-04-23", "last_updated": "2026-04-23", "cost": { - "input": 0.3, - "output": 2.5, - "cache_read": 0.06 + "input": 0, + "output": 0 }, "type": "chat" }, @@ -242967,17 +246231,19 @@ "context": 262144, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-21", - "last_updated": "2026-04-21", + "open_weights": true, + "release_date": "2026-04-24", + "last_updated": "2026-04-24", "cost": { - "input": 0.08, - "output": 0.24 + "input": 0.1, + "output": 0.3, + "cache_read": 0.02 }, "type": "chat" }, @@ -243022,8 +246288,9 @@ }, "limit": { "context": 131072, - "output": 8192 + "output": 131072 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -243034,6 +246301,16 @@ "supported": true } }, + "attachment": false, + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-10-12", + "last_updated": "2025-10-12", + "cost": { + "input": 0.56, + "output": 2.24, + "cache_read": 0.11 + }, "type": "chat" }, { @@ -243052,6 +246329,7 @@ "context": 262144, "output": 65536 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -243060,10 +246338,11 @@ "attachment": false, "open_weights": false, "release_date": "2026-05-08", - "last_updated": "2026-05-08", + "last_updated": "2026-05-27", "cost": { - "input": 1, - "output": 3 + "input": 0.3, + 
"output": 2.5, + "cache_read": 0.06 }, "type": "chat" }, @@ -243179,8 +246458,8 @@ ] }, "limit": { - "context": 204800, - "output": 131072 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -243190,24 +246469,13 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": false, - "open_weights": true, - "release_date": "2025-10-27", - "last_updated": "2025-10-27", - "cost": { - "input": 0.3, - "output": 1.2, - "cache_read": 0.03 - }, + "open_weights": false, + "release_date": "2025-10-28", + "last_updated": "2025-10-28", "type": "chat" }, { @@ -243223,20 +246491,21 @@ ] }, "limit": { - "context": 65532, + "context": 65536, "output": 2048 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, - "open_weights": false, - "release_date": "2026-01-24", - "last_updated": "2026-01-24", + "open_weights": true, + "release_date": "2026-01-23", + "last_updated": "2026-03-15", "cost": { - "input": 0.30200000000000005, - "output": 1.2069999999999999 + "input": 0.3, + "output": 1.2 }, "type": "chat" }, @@ -243253,9 +246522,10 @@ ] }, "limit": { - "context": 200000, - "output": 131072 + "context": 204800, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -243268,12 +246538,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-12-19", - "last_updated": "2025-12-19", - "cost": { - "input": 0.33, - "output": 1.32 - }, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { @@ -243290,8 +246556,9 @@ }, "limit": { "context": 204800, - "output": 131072 + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -243306,10 +246573,6 @@ "open_weights": false, "release_date": "2026-02-12", "last_updated": 
"2026-02-12", - "cost": { - "input": 0.3, - "output": 1.2 - }, "type": "chat" }, { @@ -243363,48 +246626,6 @@ "context": 204800, "output": 131072 }, - "tool_call": true, - "reasoning": { - "supported": true, - "default": true - }, - "extra_capabilities": { - "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] - } - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-18", - "last_updated": "2026-03-18", - "cost": { - "input": 0.3, - "output": 1.2 - }, - "type": "chat" - }, - { - "id": "minimax/minimax-m2.7-highspeed", - "name": "MiniMax: MiniMax M2.7 highspeed", - "display_name": "MiniMax: MiniMax M2.7 highspeed", - "modalities": { - "input": [ - "text" - ], - "output": [ - "text" - ] - }, - "limit": { - "context": 204800, - "output": 131072 - }, "temperature": true, "tool_call": true, "reasoning": { @@ -243425,7 +246646,52 @@ "attachment": false, "open_weights": true, "release_date": "2026-03-18", - "last_updated": "2026-05-27", + "last_updated": "2026-03-18", + "cost": { + "input": 0.3, + "output": 1.2, + "cache_read": 0.06, + "cache_write": 0.375 + }, + "type": "chat" + }, + { + "id": "minimax/minimax-m2.7-highspeed", + "name": "MiniMax: MiniMax M2.7 highspeed", + "display_name": "MiniMax: MiniMax M2.7 highspeed", + "modalities": { + "input": [ + "text" + ], + "output": [ + "text" + ] + }, + "limit": { + "context": 204800, + "output": 131100 + }, + "temperature": true, + "tool_call": true, + "reasoning": { + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } + }, + "attachment": true, + "open_weights": true, + "release_date": "2026-03-18", + "last_updated": "2026-03-18", "cost": { "input": 0.6, "output": 2.4, @@ -243441,19 +246707,22 @@ "modalities": { "input": [ 
"text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 512000, - "output": 80000 + "context": 1000000, + "output": 1000000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -243462,7 +246731,7 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-06-01", + "release_date": "2026-05-31", "last_updated": "2026-06-01", "cost": { "input": 0.3, @@ -243486,7 +246755,7 @@ }, "limit": { "context": 262144, - "output": 52429 + "output": 262144 }, "temperature": true, "tool_call": true, @@ -243495,12 +246764,9 @@ }, "attachment": true, "open_weights": true, + "knowledge": "2024-11", "release_date": "2024-11-01", - "last_updated": "2025-12-16", - "cost": { - "input": 0.5, - "output": 1.5 - }, + "last_updated": "2025-12-02", "type": "chat" }, { @@ -243510,7 +246776,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "video" ], "output": [ "text" @@ -243518,8 +246785,9 @@ }, "limit": { "context": 256000, - "output": 65536 + "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true @@ -243537,12 +246805,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-26", - "last_updated": "2026-01-26", - "cost": { - "input": 0.3, - "output": 1.9 - }, + "release_date": "2026-01-28", + "last_updated": "2026-01-28", "type": "chat" }, { @@ -243552,15 +246816,16 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 262000, + "output": 262000 }, "temperature": true, "tool_call": true, @@ -243570,25 +246835,18 @@ }, "extra_capabilities": { "reasoning": { - "supported": true, - "interleaved": true, - "summaries": true, - "visibility": "summary", - "continuation": [ - "thinking_blocks" - ] + "supported": true } }, "attachment": true, "open_weights": true, 
"knowledge": "2025-01", - "release_date": "2026-04-21", + "release_date": "2026-04-20", "last_updated": "2026-04-21", "cost": { "input": 0.95, "output": 4, - "cache_read": 0.2, - "cache_write": 0 + "cache_read": 0.16 }, "type": "chat" }, @@ -243634,8 +246892,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -243645,17 +246902,20 @@ "context": 1047576, "output": 32768 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, - "release_date": "2025-09-10", - "last_updated": "2025-09-10", + "knowledge": "2024-04", + "release_date": "2025-04-14", + "last_updated": "2025-04-14", "cost": { "input": 2, - "output": 8 + "output": 8, + "cache_read": 0.5 }, "type": "chat" }, @@ -243676,17 +246936,20 @@ "context": 1047576, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, + "knowledge": "2024-04", "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { "input": 0.4, - "output": 1.6 + "output": 1.6, + "cache_read": 0.1 }, "type": "chat" }, @@ -243697,8 +246960,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -243708,17 +246970,20 @@ "context": 1047576, "output": 32768 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, + "knowledge": "2024-04", "release_date": "2025-04-14", "last_updated": "2025-04-14", "cost": { "input": 0.1, - "output": 0.4 + "output": 0.4, + "cache_read": 0.025 }, "type": "chat" }, @@ -243729,7 +246994,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -243739,17 +247005,20 @@ "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, 
"open_weights": false, + "knowledge": "2023-09", "release_date": "2024-05-13", - "last_updated": "2024-05-13", + "last_updated": "2024-08-06", "cost": { - "input": 2.499, - "output": 9.996 + "input": 2.5, + "output": 10, + "cache_read": 1.25 }, "type": "chat" }, @@ -243770,17 +247039,20 @@ "context": 128000, "output": 16384 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": false }, "attachment": true, "open_weights": false, + "knowledge": "2024-10", "release_date": "2024-07-18", "last_updated": "2024-07-18", "cost": { - "input": 0.1496, - "output": 0.595 + "input": 0.15, + "output": 0.6, + "cache_read": 0.08 }, "type": "chat" }, @@ -243791,17 +247063,21 @@ "modalities": { "input": [ "text", + "audio", "image", - "pdf" + "video" ], "output": [ - "text" + "text", + "audio", + "image" ] }, "limit": { "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -243830,13 +247106,15 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.13 }, - "type": "chat" + "type": "imageGeneration" }, { "id": "openai/gpt-5-chat", @@ -243844,31 +247122,31 @@ "display_name": "OpenAI: GPT-5 Chat", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 128000, - "output": 16384 + "context": 400000, + "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-08-07", - "last_updated": "2026-03-15", + "last_updated": "2025-08-07", "cost": { "input": 1.25, - "output": 10, - "cache_read": 0.125 + "output": 10 }, "type": "chat" }, @@ -243878,17 +247156,19 @@ 
"display_name": "OpenAI: GPT-5 Codex", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 400000, + "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -243914,13 +247194,15 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, + "knowledge": "2024-10-01", "release_date": "2025-09-15", "last_updated": "2025-09-15", "cost": { - "input": 9.996, - "output": 19.992 + "input": 1.25, + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, @@ -243938,10 +247220,11 @@ ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 128000, + "output": 32000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -243969,11 +247252,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-05-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { "input": 0.25, - "output": 2 + "output": 2, + "cache_read": 0.03 }, "type": "chat" }, @@ -243983,18 +247268,18 @@ "display_name": "OpenAI: GPT-5 Nano", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "text" ] }, "limit": { - "context": 400000, - "output": 128000 + "context": 16000, + "output": 4000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, "default": true @@ -244022,11 +247307,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-05-30", "release_date": "2025-08-07", "last_updated": "2025-08-07", "cost": { "input": 0.05, - "output": 0.4 + "output": 0.4, + "cache_read": 0.01 }, "type": "chat" }, @@ -244045,9 +247332,10 @@ }, "limit": { "context": 400000, - "output": 128000 + "output": 272000 }, - "tool_call": false, + "temperature": false, + "tool_call": true, "reasoning": { "supported": true, 
"default": true @@ -244069,8 +247357,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2025-08-07", - "last_updated": "2025-08-07", + "knowledge": "2024-09-30", + "release_date": "2025-10-06", + "last_updated": "2025-10-06", "cost": { "input": 15, "output": 120 @@ -244084,8 +247373,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -244095,6 +247383,7 @@ "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244123,11 +247412,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, @@ -244137,9 +247428,8 @@ "display_name": "OpenAI: GPT-5.1 Chat", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -244149,15 +247439,17 @@ "context": 128000, "output": 16384 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-11-13", - "last_updated": "2026-03-15", + "last_updated": "2025-11-13", "cost": { "input": 1.25, "output": 10, @@ -244182,7 +247474,8 @@ "context": 400000, "output": 128000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true, "default": false @@ -244210,11 +247503,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { "input": 1.25, - "output": 10 + "output": 10, + "cache_read": 0.125 }, "type": "chat" }, @@ -244233,9 +247528,10 @@ }, "limit": { "context": 400000, - "output": 128000 + "output": 100000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": 
{ "supported": true, "default": false @@ -244263,11 +247559,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-09-30", "release_date": "2025-11-13", "last_updated": "2025-11-13", "cost": { "input": 0.25, - "output": 2 + "output": 2, + "cache_read": 0.025 }, "type": "chat" }, @@ -244278,8 +247576,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -244289,6 +247586,7 @@ "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -244318,11 +247616,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { "input": 1.75, - "output": 14 + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -244332,9 +247632,8 @@ "display_name": "OpenAI: GPT-5.2 Chat", "modalities": { "input": [ - "image", - "pdf", - "text" + "text", + "image" ], "output": [ "text" @@ -244347,12 +247646,14 @@ "temperature": false, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2025-12-11", - "last_updated": "2026-03-15", + "last_updated": "2025-12-11", "cost": { "input": 1.75, "output": 14, @@ -244367,8 +247668,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + "image" ], "output": [ "text" @@ -244378,6 +247678,7 @@ "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -244405,8 +247706,9 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-01-01", - "last_updated": "2026-01-01", + "knowledge": "2025-08-31", + "release_date": "2025-12-11", + "last_updated": "2025-12-11", "cost": { "input": 21, "output": 168 @@ -244420,8 +247722,7 @@ "modalities": { "input": [ "text", - "image", - "pdf" + 
"image" ], "output": [ "text" @@ -244431,6 +247732,7 @@ "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244459,11 +247761,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-01-14", "last_updated": "2026-01-14", "cost": { "input": 1.75, - "output": 14 + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -244473,9 +247777,9 @@ "display_name": "OpenAI: GPT-5.3 Chat", "modalities": { "input": [ + "text", "image", - "pdf", - "text" + "pdf" ], "output": [ "text" @@ -244485,17 +247789,20 @@ "context": 128000, "output": 16384 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": true, "open_weights": false, - "release_date": "2026-03-04", - "last_updated": "2026-03-15", + "release_date": "2026-03-03", + "last_updated": "2026-03-06", "cost": { "input": 1.75, - "output": 14 + "output": 14, + "cache_read": 0.175 }, "type": "chat" }, @@ -244517,6 +247824,7 @@ "context": 400000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -244545,6 +247853,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-02-24", "last_updated": "2026-02-24", "cost": { @@ -244569,9 +247878,10 @@ ] }, "limit": { - "context": 922000, + "context": 1050000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -244601,6 +247911,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-03-05", "last_updated": "2026-03-05", "cost": { @@ -244628,6 +247939,7 @@ "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244657,6 +247969,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-03-17", 
"last_updated": "2026-03-17", "cost": { @@ -244684,6 +247997,7 @@ "context": 400000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244713,6 +248027,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-03-17", "last_updated": "2026-03-17", "cost": { @@ -244737,9 +248052,10 @@ ] }, "limit": { - "context": 922000, + "context": 1050000, "output": 128000 }, + "temperature": false, "tool_call": true, "reasoning": { "supported": true, @@ -244767,12 +248083,13 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-08-31", "release_date": "2026-03-05", "last_updated": "2026-03-05", "cost": { "input": 30, "output": 180, - "cache_read": 3 + "cache_read": 30 }, "type": "chat" }, @@ -244794,6 +248111,7 @@ "context": 1000000, "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244822,7 +248140,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-23", + "knowledge": "2025-12-01", + "release_date": "2026-04-24", "last_updated": "2026-04-23", "cost": { "input": 5, @@ -244846,10 +248165,10 @@ ] }, "limit": { - "context": 1050000, + "context": 1000000, "output": 128000 }, - "temperature": false, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244862,8 +248181,9 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2025-12-01", "release_date": "2026-04-24", - "last_updated": "2026-05-01", + "last_updated": "2026-04-23", "cost": { "input": 30, "output": 180 @@ -244876,26 +248196,30 @@ "display_name": "OpenAI: GPT-Image-1.5", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "image" ] }, "limit": { - "context": 128000, + "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, 
"release_date": "2025-12-16", "last_updated": "2025-12-16", + "cost": { + "input": 5, + "output": 32, + "cache_read": 1.25 + }, "type": "imageGeneration" }, { @@ -244904,8 +248228,7 @@ "display_name": "OpenAI: GPT-Image-2", "modalities": { "input": [ - "text", - "image" + "text" ], "output": [ "image" @@ -244915,19 +248238,19 @@ "context": 8192, "output": 8192 }, - "temperature": false, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, - "attachment": true, + "attachment": false, "open_weights": false, "release_date": "2026-04-21", "last_updated": "2026-04-21", "cost": { - "input": 5.0505, - "output": 32.3232, - "cache_read": 1.2626 + "input": 5, + "output": 30, + "cache_read": 1.25 }, "type": "imageGeneration" }, @@ -244937,7 +248260,8 @@ "display_name": "OpenAI: o4 Mini", "modalities": { "input": [ - "text" + "text", + "image" ], "output": [ "text" @@ -244947,6 +248271,7 @@ "context": 200000, "output": 100000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -244966,13 +248291,15 @@ "visibility": "hidden" } }, - "attachment": false, + "attachment": true, "open_weights": false, + "knowledge": "2024-06", "release_date": "2025-04-16", "last_updated": "2025-04-16", "cost": { "input": 1.1, - "output": 4.4 + "output": 4.4, + "cache_read": 0.28 }, "type": "chat" }, @@ -245044,22 +248371,13 @@ }, "limit": { "context": 262144, - "output": 52429 + "output": 262144 }, - "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2025-04", - "last_updated": "2026-01", - "cost": { - "input": 0.071, - "output": 0.1 - }, "type": "chat" }, { @@ -245075,12 +248393,14 @@ ] }, "limit": { - "context": 256000, - "output": 256000 + "context": 262144, + "output": 131072 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, 
"extra_capabilities": { "reasoning": { @@ -245094,12 +248414,12 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2025-09-11", - "last_updated": "2025-09-11", + "open_weights": true, + "release_date": "2025-08-23", + "last_updated": "2025-08-23", "cost": { - "input": 0.3, - "output": 0.5 + "input": 0.2, + "output": 0.6 }, "type": "chat" }, @@ -245116,10 +248436,11 @@ ] }, "limit": { - "context": 41000, - "output": 32768 + "context": 131072, + "output": 8192 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { "supported": true }, @@ -245136,11 +248457,11 @@ }, "attachment": false, "open_weights": false, - "release_date": "2024-01-01", - "last_updated": "2024-01-01", + "release_date": "2025-04-30", + "last_updated": "2025-11-25", "cost": { - "input": 0.08, - "output": 0.24 + "input": 0.07, + "output": 0.28 }, "type": "chat" }, @@ -245157,20 +248478,13 @@ ] }, "limit": { - "context": 262000, - "output": 65536 + "context": 262144, + "output": 262144 }, "tool_call": true, "reasoning": { - "supported": false - }, - "attachment": false, - "open_weights": false, - "release_date": "2026-03-17", - "last_updated": "2026-03-17", - "cost": { - "input": 0.13, - "output": 0.5 + "supported": true, + "default": true }, "type": "chat" }, @@ -245187,20 +248501,24 @@ ] }, "limit": { - "context": 128000, - "output": 65536 + "context": 4096, + "output": 4096 }, + "temperature": true, "tool_call": false, "reasoning": { "supported": false }, "attachment": false, "open_weights": false, - "release_date": "2025-09-17", - "last_updated": "2025-09-17", + "knowledge": "2025-01-01", + "release_date": "2025-07-23", + "last_updated": "2025-07-23", "cost": { "input": 1, - "output": 5 + "output": 5, + "cache_read": 0.1, + "cache_write": 1.25 }, "type": "chat" }, @@ -245217,10 +248535,11 @@ ] }, "limit": { - "context": 256000, - "output": 32768 + "context": 262144, + "output": 65536 }, - "tool_call": false, + "temperature": true, + "tool_call": 
true, "reasoning": { "supported": true }, @@ -245237,11 +248556,12 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-05", - "last_updated": "2025-09-05", + "knowledge": "2025-04", + "release_date": "2025-09-24", + "last_updated": "2025-09-24", "cost": { - "input": 1.08018, - "output": 5.4009 + "input": 2.11, + "output": 8.45 }, "type": "chat" }, @@ -245332,20 +248652,21 @@ "modalities": { "input": [ "text", - "image", - "video" + "image" ], "output": [ "text" ] }, "limit": { - "context": 983616, - "output": 65536 + "context": 1000000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -245360,12 +248681,12 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-02-16", - "last_updated": "2026-02-16", + "knowledge": "2025-01-01", + "release_date": "2026-03-20", + "last_updated": "2026-03-20", "cost": { - "input": 0.4, - "output": 2.4, - "cache_read": 0.04 + "input": 0.8, + "output": 4.8 }, "type": "chat" }, @@ -245465,7 +248786,6 @@ "display_name": "Qwen: Qwen3.6-Plus", "modalities": { "input": [ - "image", "text" ], "output": [ @@ -245474,7 +248794,7 @@ }, "limit": { "context": 1000000, - "output": 65536 + "output": 64000 }, "temperature": true, "tool_call": true, @@ -245493,15 +248813,15 @@ ] } }, - "attachment": true, + "attachment": false, "open_weights": false, - "release_date": "2025-08-26", - "last_updated": "2026-04-11", + "release_date": "2026-03-30", + "last_updated": "2026-03-30", "cost": { - "input": 0.325, - "output": 1.95, - "cache_read": 0.0325, - "cache_write": 0.40625 + "input": 0.5, + "output": 3, + "cache_read": 0.05, + "cache_write": 0.625 }, "type": "chat" }, @@ -245619,7 +248939,36 @@ "display_name": "StepFun: Step 3.5 Flash", "modalities": { "input": [ + "text", + "image" + ], + "output": [ "text" + ] + }, + "limit": { + "context": 64000, + 
"output": 4096 + }, + "temperature": true, + "tool_call": false, + "reasoning": { + "supported": false + }, + "attachment": true, + "open_weights": false, + "release_date": "2026-02-02", + "last_updated": "2026-02-02", + "type": "chat" + }, + { + "id": "stepfun/step-3.7-flash", + "name": "StepFun: Step 3.7 Flash", + "display_name": "StepFun: Step 3.7 Flash", + "modalities": { + "input": [ + "text", + "image" ], "output": [ "text" @@ -245635,21 +248984,22 @@ "supported": true, "default": true }, - "attachment": false, - "open_weights": true, - "release_date": "2026-01-29", - "last_updated": "2026-01-29", + "attachment": true, + "open_weights": false, + "knowledge": "2026-01-01", + "release_date": "2026-05-28", + "last_updated": "2026-05-29", "cost": { - "input": 0.1, - "output": 0.3, - "cache_read": 0.02 + "input": 0.2, + "output": 1.15, + "cache_read": 0.04 }, "type": "chat" }, { - "id": "stepfun/step-3.7-flash", - "name": "StepFun: Step 3.7 Flash", - "display_name": "StepFun: Step 3.7 Flash", + "id": "stepfun/step-3.7-flash-free", + "name": "StepFun: Step 3.7 Flash (Free)", + "display_name": "StepFun: Step 3.7 Flash (Free)", "modalities": { "input": [ "text", @@ -245670,13 +249020,14 @@ "default": true }, "attachment": true, - "open_weights": true, + "open_weights": false, "knowledge": "2026-01-01", - "release_date": "2026-05-29", + "release_date": "2026-05-28", "last_updated": "2026-05-29", "cost": { "input": 0.2, - "output": 1.15 + "output": 1.15, + "cache_read": 0.04 }, "type": "chat" }, @@ -245772,12 +249123,14 @@ ] }, "limit": { - "context": 262144, - "output": 262144 + "context": 256000, + "output": 64000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { @@ -245785,13 +249138,14 @@ } }, "attachment": false, - "open_weights": false, - "release_date": "2026-04-23", - "last_updated": "2026-04-23", + "open_weights": true, + 
"release_date": "2026-04-20", + "last_updated": "2026-04-20", "cost": { - "input": 0.066, - "output": 0.26, - "cache_read": 0.029 + "input": 0.172, + "output": 0.572, + "cache_read": 0.058, + "cache_write": 0 }, "type": "chat" }, @@ -245871,7 +249225,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -245881,6 +249236,7 @@ "context": 1000000, "output": 1000000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -245893,12 +249249,13 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-04-30", - "last_updated": "2026-04-30", + "release_date": "2026-04-17", + "last_updated": "2026-04-17", "cost": { "input": 1.25, "output": 2.5, - "cache_read": 0.2 + "cache_read": 0.2, + "cache_write": 0 }, "type": "chat" }, @@ -245909,7 +249266,8 @@ "modalities": { "input": [ "text", - "image" + "image", + "pdf" ], "output": [ "text" @@ -245919,6 +249277,7 @@ "context": 256000, "output": 256000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -245931,8 +249290,8 @@ }, "attachment": true, "open_weights": false, - "release_date": "2026-05-20", - "last_updated": "2026-05-20", + "release_date": "2026-04-16", + "last_updated": "2026-04-16", "cost": { "input": 1, "output": 2, @@ -245954,19 +249313,23 @@ }, "limit": { "context": 256000, - "output": 32768 + "output": 256000 }, - "tool_call": false, + "temperature": true, + "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true }, "attachment": false, - "open_weights": false, - "release_date": "2025-12-17", - "last_updated": "2025-12-17", + "open_weights": true, + "knowledge": "2024-12-01", + "release_date": "2025-12-16", + "last_updated": "2026-02-04", "cost": { - "input": 0.102, - "output": 0.306 + "input": 0.1, + "output": 0.3, + "cache_read": 0.01 }, "type": "chat" }, @@ -245978,16 +249341,17 @@ "input": [ "text", "image", - "video" + "pdf" ], "output": [ "text" ] }, "limit": 
{ - "context": 1048576, - "output": 131072 + "context": 1050000, + "output": 131100 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, @@ -245995,6 +249359,7 @@ }, "attachment": true, "open_weights": false, + "knowledge": "2024-12", "release_date": "2026-04-22", "last_updated": "2026-04-22", "cost": { @@ -246010,23 +249375,27 @@ "display_name": "Xiaomi: MiMo-V2.5-Pro", "modalities": { "input": [ - "text" + "text", + "image", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 1048576, - "output": 131072 + "context": 1050000, + "output": 131000 }, + "temperature": true, "tool_call": true, "reasoning": { "supported": true, "default": true }, - "attachment": false, + "attachment": true, "open_weights": false, + "knowledge": "2024-12", "release_date": "2026-04-22", "last_updated": "2026-04-22", "cost": { @@ -246060,12 +249429,14 @@ }, "attachment": false, "open_weights": true, + "knowledge": "2025-04", "release_date": "2025-07-28", - "last_updated": "2026-03-15", + "last_updated": "2025-07-28", "cost": { "input": 0.6, "output": 2.2, - "cache_read": 0.175 + "cache_read": 0.11, + "cache_write": 0 }, "type": "chat" }, @@ -246093,12 +249464,14 @@ }, "attachment": false, "open_weights": true, + "knowledge": "2025-04", "release_date": "2025-07-28", "last_updated": "2025-07-28", "cost": { - "input": 0.13, - "output": 0.85, - "cache_read": 0.025 + "input": 0.2, + "output": 1.1, + "cache_read": 0.03, + "cache_write": 0 }, "type": "chat" }, @@ -246116,12 +249489,12 @@ }, "limit": { "context": 200000, - "output": 65535 + "output": 200000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true, - "default": true + "supported": true }, "extra_capabilities": { "reasoning": { @@ -246130,12 +249503,8 @@ }, "attachment": false, "open_weights": false, - "release_date": "2025-09-30", - "last_updated": "2025-09-30", - "cost": { - "input": 0.4, - "output": 1.5 - }, + "release_date": "2025-10-11", + "last_updated": "2025-10-11", 
"type": "chat" }, { @@ -246144,8 +249513,8 @@ "display_name": "Z.AI: GLM 4.6V", "modalities": { "input": [ - "image", "text", + "image", "video" ], "output": [ @@ -246153,8 +249522,8 @@ ] }, "limit": { - "context": 131072, - "output": 131072 + "context": 200000, + "output": 64000 }, "temperature": true, "tool_call": true, @@ -246163,12 +249532,14 @@ "default": true }, "attachment": true, - "open_weights": true, - "release_date": "2025-09-30", - "last_updated": "2026-01-10", + "open_weights": false, + "knowledge": "2025-01-01", + "release_date": "2025-12-08", + "last_updated": "2025-12-08", "cost": { - "input": 0.3, - "output": 0.9 + "input": 0.14, + "output": 0.42, + "cache_read": 0.03 }, "type": "chat" }, @@ -246257,8 +249628,8 @@ ] }, "limit": { - "context": 202752, - "output": 65535 + "context": 200000, + "output": 200000 }, "temperature": true, "tool_call": true, @@ -246278,14 +249649,9 @@ } }, "attachment": false, - "open_weights": true, - "release_date": "2025-12-22", - "last_updated": "2026-03-15", - "cost": { - "input": 0.38, - "output": 1.98, - "cache_read": 0.2 - }, + "open_weights": false, + "release_date": "2025-12-23", + "last_updated": "2025-12-23", "type": "chat" }, { @@ -246384,8 +249750,8 @@ ] }, "limit": { - "context": 202752, - "output": 131072 + "context": 200000, + "output": 128000 }, "temperature": true, "tool_call": true, @@ -246405,13 +249771,9 @@ } }, "attachment": false, - "open_weights": true, + "open_weights": false, "release_date": "2026-02-12", - "last_updated": "2026-03-15", - "cost": { - "input": 0.72, - "output": 2.3 - }, + "last_updated": "2026-02-12", "type": "chat" }, { @@ -246427,26 +249789,28 @@ ] }, "limit": { - "context": 202800, - "output": 131072 + "context": 200000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": true + "supported": true, + "default": true }, "extra_capabilities": { "reasoning": { "supported": true } }, - "attachment": false, + "attachment": true, 
"open_weights": false, - "release_date": "2026-03-15", - "last_updated": "2026-03-15", + "knowledge": "2025-01-01", + "release_date": "2026-03-20", + "last_updated": "2026-03-20", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.88, + "output": 3.48 }, "type": "chat" }, @@ -246463,7 +249827,7 @@ ] }, "limit": { - "context": 202752, + "context": 200000, "output": 131072 }, "temperature": true, @@ -246474,16 +249838,23 @@ }, "extra_capabilities": { "reasoning": { - "supported": true + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] } }, "attachment": false, - "open_weights": true, - "release_date": "2026-03-27", - "last_updated": "2026-03-27", + "open_weights": false, + "release_date": "2026-04-03", + "last_updated": "2026-04-03", "cost": { - "input": 1.26, - "output": 3.96 + "input": 0.8781, + "output": 3.5126, + "cache_read": 0.1903 }, "type": "chat" }, @@ -246494,28 +249865,43 @@ "modalities": { "input": [ "text", - "image" + "image", + "video", + "pdf" ], "output": [ "text" ] }, "limit": { - "context": 202800, - "output": 131100 + "context": 200000, + "output": 128000 }, + "temperature": true, "tool_call": true, "reasoning": { - "supported": false + "supported": true, + "default": true + }, + "extra_capabilities": { + "reasoning": { + "supported": true, + "interleaved": true, + "summaries": true, + "visibility": "summary", + "continuation": [ + "thinking_blocks" + ] + } }, "attachment": true, "open_weights": false, "release_date": "2026-04-01", "last_updated": "2026-04-01", "cost": { - "input": 1.2, - "output": 4, - "cache_read": 0.24 + "input": 0.726, + "output": 3.1946, + "cache_read": 0.1743 }, "type": "chat" } diff --git a/scripts/architecture-guard.mjs b/scripts/architecture-guard.mjs index fef93c95d..83ecd468b 100644 --- a/scripts/architecture-guard.mjs +++ b/scripts/architecture-guard.mjs @@ -22,13 +22,15 @@ const MAIN_GUARD_PATHS = [ ] const 
RENDERER_SOURCE_ROOT = path.join(ROOT, 'src/renderer/src') +const RENDERER_SETTINGS_ROOT = path.join(ROOT, 'src/renderer/settings') +const RENDERER_BUSINESS_ROOTS = [RENDERER_SOURCE_ROOT, RENDERER_SETTINGS_ROOT] const RENDERER_TYPED_BOUNDARY_ROOT = path.join(ROOT, 'src/renderer/api') const RENDERER_QUARANTINE_ROOT = path.join(ROOT, 'src/renderer/api/legacy') -const RENDERER_QUARANTINE_ROOTS = [RENDERER_QUARANTINE_ROOT] +const RENDERER_QUARANTINE_ROOTS = [] const RETIRED_RENDERER_LEGACY_ENTRY_PATHS = [ - path.join(ROOT, 'src/renderer/src/composables/usePresenter.ts') + path.join(ROOT, 'src/renderer/src/composables/usePresenter.ts'), + RENDERER_QUARANTINE_ROOT ] -const RENDERER_QUARANTINE_MAX_SOURCE_FILES = 3 const RENDERER_TYPED_BOUNDARY_WINDOW_API_ALLOWLIST = [ path.join(ROOT, 'src/renderer/api/runtime.ts') ] @@ -63,6 +65,7 @@ const MIGRATED_RAW_CHANNEL_GUARD_PATHS = [ path.join(ROOT, 'src/renderer/src/stores/ui/pageRouter.ts'), path.join(ROOT, 'src/renderer/src/pages/ChatPage.vue'), path.join(ROOT, 'src/renderer/src/pages/NewThreadPage.vue'), + path.join(ROOT, 'src/renderer/settings'), path.join(ROOT, 'src/main/presenter/windowPresenter'), path.join(ROOT, 'src/main/presenter/configPresenter'), path.join(ROOT, 'src/main/presenter/agentSessionPresenter'), @@ -99,6 +102,8 @@ const LEGACY_PRESENTER_HELPER_CALL_PATTERN = /(? 
RENDERER_QUARANTINE_MAX_SOURCE_FILES) { - violations.push( - `[renderer-quarantine-growth] ${relativePath(RENDERER_QUARANTINE_ROOT)} expected <= ${RENDERER_QUARANTINE_MAX_SOURCE_FILES} source files, found ${quarantineFiles.length}` - ) - } - for (const retiredEntryPath of RETIRED_RENDERER_LEGACY_ENTRY_PATHS) { if (await pathExists(retiredEntryPath)) { violations.push( @@ -371,13 +363,14 @@ async function main() { const source = await fs.readFile(filePath, 'utf8') const specifiers = extractModuleSpecifiers(source) - if (isUnder(filePath, RENDERER_SOURCE_ROOT)) { + if (RENDERER_BUSINESS_ROOTS.some((root) => isUnder(filePath, root))) { const file = relativePath(filePath) const legacyPresenterHelperCount = countMatches( source, LEGACY_PRESENTER_HELPER_CALL_PATTERN ) const legacyPresenterImportCount = countMatches(source, LEGACY_PRESENTER_IMPORT_PATTERN) + const legacyRuntimeImportCount = countMatches(source, LEGACY_RUNTIME_IMPORT_PATTERN) const windowElectronCount = countMatches(source, WINDOW_ELECTRON_PATTERN) const windowApiCount = countMatches(source, WINDOW_API_PATTERN) const actualListenerCount = countMatches(source, IPC_RENDERER_LISTENER_PATTERN) @@ -388,6 +381,12 @@ async function main() { ) } + if (legacyRuntimeImportCount > 0) { + violations.push( + `[renderer-business-direct-legacy-runtime-import] ${file} must not import renderer legacy runtime helpers` + ) + } + if (legacyPresenterHelperCount > 0) { violations.push( `[renderer-business-direct-use-presenter] ${file} expected 0, found ${legacyPresenterHelperCount}` diff --git a/scripts/generate-architecture-baseline.mjs b/scripts/generate-architecture-baseline.mjs index fc5c29d9c..345d21e08 100644 --- a/scripts/generate-architecture-baseline.mjs +++ b/scripts/generate-architecture-baseline.mjs @@ -21,16 +21,22 @@ const ANALYSIS_TARGETS = [ root: path.join(ROOT, 'src/main') }, { - label: 'renderer', + label: 'renderer-main', root: path.join(ROOT, 'src/renderer/src') + }, + { + label: 'renderer-settings', + 
root: path.join(ROOT, 'src/renderer/settings') } ] const MAIN_SOURCE_ROOT = path.join(ROOT, 'src/main') const RENDERER_SOURCE_ROOT = path.join(ROOT, 'src/renderer/src') +const RENDERER_SETTINGS_ROOT = path.join(ROOT, 'src/renderer/settings') +const RENDERER_BUSINESS_ROOTS = [RENDERER_SOURCE_ROOT, RENDERER_SETTINGS_ROOT] const RENDERER_QUARANTINE_ROOT = path.join(ROOT, 'src/renderer/api/legacy') -const RENDERER_QUARANTINE_ROOTS = [RENDERER_QUARANTINE_ROOT] -const RENDERER_QUARANTINE_EXIT_MAX_FILES = 3 +const RENDERER_QUARANTINE_ROOTS = [] +const RENDERER_QUARANTINE_EXIT_MAX_FILES = 0 const BRIDGE_REGISTER_PATH = path.join( ROOT, 'docs/architecture/baselines/main-kernel-bridge-register.json' @@ -444,7 +450,7 @@ function combineCountMaps(...maps) { } async function collectRendererPatternCountsByLayer(pattern) { - const businessFiles = await walk(RENDERER_SOURCE_ROOT) + const businessFiles = await collectFilesFromTargets(RENDERER_BUSINESS_ROOTS) const quarantineFiles = await collectFilesFromTargets(RENDERER_QUARANTINE_ROOTS) const business = await collectPatternCounts(businessFiles, pattern) @@ -739,8 +745,8 @@ function renderBoundaryBaselineReport({ lines.push('## Renderer Single-Track Split') lines.push('') - lines.push('- Business layer: `src/renderer/src/**`') - lines.push('- Quarantine layer: `src/renderer/api/legacy/**`') + lines.push('- Business layer: `src/renderer/src/**`, `src/renderer/settings/**`') + lines.push('- Retired quarantine layer: `src/renderer/api/legacy/**` must remain deleted') lines.push('') lines.push('| Legacy surface | Business layer | Quarantine layer | Total |') lines.push('| --- | --- | --- | --- |') @@ -757,12 +763,12 @@ function renderBoundaryBaselineReport({ lines.push('## Quarantine Exit Snapshot') lines.push('') - lines.push('- Retained capability family: `renderer legacy transport`') + lines.push('- Retained capability family: none; `renderer legacy transport` is retired') lines.push( `- Source files: ${quarantineSourceFiles.length} 
/ ${RENDERER_QUARANTINE_EXIT_MAX_FILES}` ) lines.push( - '- Delete condition: remove after settings compatibility surfaces stop importing the quarantine adapters.' + '- Delete condition: already satisfied; a recreated quarantine directory is a regression.' ) lines.push('') @@ -882,8 +888,11 @@ async function main() { } const archiveReferences = await collectArchiveReferences() - const mainAndRendererFiles = await collectFilesFromTargets([MAIN_SOURCE_ROOT, RENDERER_SOURCE_ROOT]) - const rendererBusinessFiles = await walk(RENDERER_SOURCE_ROOT) + const mainAndRendererFiles = await collectFilesFromTargets([ + MAIN_SOURCE_ROOT, + ...RENDERER_BUSINESS_ROOTS + ]) + const rendererBusinessFiles = await collectFilesFromTargets(RENDERER_BUSINESS_ROOTS) const quarantineExists = await pathExists(RENDERER_QUARANTINE_ROOT) const quarantineSourceFiles = await collectFilesFromTargets(RENDERER_QUARANTINE_ROOTS) const usePresenterCountsByLayer = await collectRendererPatternCountsByLayer( @@ -957,16 +966,19 @@ async function main() { const p2Ready = Object.values(p2PresenterCounts).every((count) => count === 0) const p3Ready = Object.values(p3PresenterCounts).every((count) => count === 0) const p4Ready = Object.values(p4PresenterCounts).every((count) => count === 0) - const p5Ready = p1Ready && quarantineSourceFiles.length <= RENDERER_QUARANTINE_EXIT_MAX_FILES + const p5Ready = + p1Ready && + !quarantineExists && + quarantineSourceFiles.length <= RENDERER_QUARANTINE_EXIT_MAX_FILES const phaseGates = [ { phase: 'P0', indicator: - 'Fixed quarantine path `src/renderer/api/legacy/**` exists and baseline emits business/quarantine split metrics', + 'Retired quarantine path `src/renderer/api/legacy/**` must remain deleted and baseline emits business/retired split metrics', current: quarantineExists - ? '`src/renderer/api/legacy/**` exists; split metrics emitted' - : '`src/renderer/api/legacy/**` missing', - status: quarantineExists ? 'ready' : 'blocked' + ? 
'`src/renderer/api/legacy/**` exists' + : '`src/renderer/api/legacy/**` deleted; split metrics emitted', + status: quarantineExists ? 'blocked' : 'ready' }, { phase: 'P1', @@ -1017,7 +1029,7 @@ async function main() { { phase: 'P5', indicator: - 'Business layer direct legacy access must be `0`, and quarantine source files must satisfy the exit standard (`<= 3` source files)', + 'Business layer direct legacy access must be `0`, and retired quarantine source files must stay at `0`', current: `businessLegacy=${metrics['renderer.business.usePresenter.count']}/` + `${metrics['renderer.business.windowElectron.count']}/` + diff --git a/src/main/appMain.ts b/src/main/appMain.ts index 32fddf512..f2a14fc97 100644 --- a/src/main/appMain.ts +++ b/src/main/appMain.ts @@ -4,9 +4,8 @@ import { LifecycleManager, registerCoreHooks } from './presenter/lifecyclePresen import { getInstance, Presenter } from './presenter' import { electronApp } from '@electron-toolkit/utils' import log from 'electron-log' -import { eventBus, SendTarget } from './eventbus' -import { NOTIFICATION_EVENTS } from './events' import { registerWorkspacePreviewSchemes } from './presenter/workspacePresenter/workspacePreviewProtocol' +import { publishDeepchatEvent } from './routes/publishDeepchatEvent' import { findDeepLinkArg, findStartupDeepLink, @@ -25,6 +24,11 @@ export function startApp(): void { } appStarted = true + const e2eUserDataDir = process.env.DEEPCHAT_E2E_USER_DATA_DIR?.trim() + if (e2eUserDataDir) { + app.setPath('userData', e2eUserDataDir) + } + app.setName(APP_NAME) if (process.platform === 'darwin') { if (app.isReady()) { @@ -55,7 +59,7 @@ export function startApp(): void { if (isNetworkError) { // Send error to renderer to show a toast notification // This is "elegant" and non-blocking - eventBus.sendToRenderer(NOTIFICATION_EVENTS.SHOW_ERROR, SendTarget.ALL_WINDOWS, { + publishDeepchatEvent('notification.error', { id: Date.now().toString(), title: 'Network Error', message: msg, diff --git 
a/src/main/contextMenuHelper.ts b/src/main/contextMenuHelper.ts index 31487c16f..594ed8a8b 100644 --- a/src/main/contextMenuHelper.ts +++ b/src/main/contextMenuHelper.ts @@ -2,6 +2,7 @@ import logger from '@shared/logger' import { BrowserWindow, Menu, MenuItemConstructorOptions, WebContents, dialog, net } from 'electron' import path from 'path' import sharp from 'sharp' +import { publishDeepchatEventToWebContents } from './routes/publishDeepchatEvent' interface ContextMenuOptions { webContents: WebContents @@ -249,11 +250,14 @@ export default function contextMenu(options: ContextMenuOptions): () => void { id: 'translate', label: options.labels?.translate || '翻译', click: () => { - options.webContents.send( - 'context-menu-translate', - params.selectionText, - params.x, - params.y + publishDeepchatEventToWebContents( + options.webContents.id, + 'contextMenu.translateRequested', + { + text: params.selectionText, + x: params.x, + y: params.y + } ) } }) @@ -263,7 +267,9 @@ export default function contextMenu(options: ContextMenuOptions): () => void { id: 'askAI', label: options.labels?.askAI || '询问AI', click: () => { - options.webContents.send('context-menu-ask-ai', params.selectionText) + publishDeepchatEventToWebContents(options.webContents.id, 'contextMenu.askAiRequested', { + text: params.selectionText + }) } }) } diff --git a/src/main/events.ts b/src/main/events.ts index 898923cc8..634658979 100644 --- a/src/main/events.ts +++ b/src/main/events.ts @@ -1,3 +1,5 @@ +export { FLOATING_BUTTON_EVENTS } from '@shared/floatingButtonChannels' + /** * 事件系统常量定义 * @@ -40,10 +42,8 @@ export const CONFIG_EVENTS = { OAUTH_LOGIN_SUCCESS: 'config:oauth-login-success', // OAuth登录成功 OAUTH_LOGIN_ERROR: 'config:oauth-login-error', // OAuth登录失败 THEME_CHANGED: 'config:theme-changed', // 主题变更事件 - FONT_SIZE_CHANGED: 'config:font-size-changed', // 字体大小变更事件 DEFAULT_SYSTEM_PROMPT_CHANGED: 'config:default-system-prompt-changed', // Default system prompt changed event CUSTOM_PROMPTS_CHANGED: 
'config:custom-prompts-changed', // 自定义提示词变更事件 - NOWLEDGE_MEM_CONFIG_UPDATED: 'config:nowledge-mem-config-updated', // Nowledge-mem configuration updated event DEFAULT_PROJECT_PATH_CHANGED: 'config:default-project-path-changed', AGENTS_CHANGED: 'config:agents-changed' } @@ -54,36 +54,6 @@ export const PROVIDER_DB_EVENTS = { UPDATED: 'provider-db:updated' // 远端刷新成功 } -// 会话相关事件 -export const CONVERSATION_EVENTS = { - LIST_UPDATED: 'conversation:list-updated', // 用于推送完整的会话列表 - - ACTIVATED: 'conversation:activated', // 替代 conversation-activated - DEACTIVATED: 'conversation:deactivated', // 替代 active-conversation-cleared - MESSAGE_EDITED: 'conversation:message-edited', // 替代 message-edited - SCROLL_TO_MESSAGE: 'conversation:scroll-to-message', - - MESSAGE_GENERATED: 'conversation:message-generated' // 主进程内部事件,一条完整的消息已生成 -} - -// 通信相关事件 -export const STREAM_EVENTS = { - RESPONSE: 'stream:response', // 替代 stream-response - END: 'stream:end', // 替代 stream-end - ERROR: 'stream:error', // 替代 stream-error - PERMISSION_UPDATED: 'stream:permission-updated' // 权限状态更新,通知前端刷新UI -} - -// New agent session events -export const SESSION_EVENTS = { - LIST_UPDATED: 'session:list-updated', - ACTIVATED: 'session:activated', - DEACTIVATED: 'session:deactivated', - STATUS_CHANGED: 'session:status-changed', - COMPACTION_UPDATED: 'session:compaction-updated', - PENDING_INPUTS_UPDATED: 'session:pending-inputs-updated' -} - // 系统相关事件 export const SYSTEM_EVENTS = { SYSTEM_THEME_UPDATED: 'system:theme-updated' @@ -91,10 +61,6 @@ export const SYSTEM_EVENTS = { // 应用更新相关事件 export const UPDATE_EVENTS = { - STATUS_CHANGED: 'update:status-changed', // 替代 update-status-changed - ERROR: 'update:error', // 替代 update-error - PROGRESS: 'update:progress', // 下载进度 - WILL_RESTART: 'update:will-restart', // 准备重启 STATE_CHANGED: 'update:state-changed' // 更新状态变化(用于生命周期管理通信) } @@ -132,45 +98,21 @@ export const DEV_EVENTS = { START_GUIDED_ONBOARDING: 'dev:start-guided-onboarding' } -// ollama 相关事件 -export const 
OLLAMA_EVENTS = { - PULL_MODEL_PROGRESS: 'ollama:pull-model-progress' -} - // MCP 相关事件 export const MCP_EVENTS = { SERVER_STARTED: 'mcp:server-started', SERVER_STOPPED: 'mcp:server-stopped', CONFIG_CHANGED: 'mcp:config-changed', - TOOL_CALL_RESULT: 'mcp:tool-call-result', SERVER_STATUS_CHANGED: 'mcp:server-status-changed', CLIENT_LIST_UPDATED: 'mcp:client-list-updated', - INITIALIZED: 'mcp:initialized', // 新增:MCP初始化完成事件 - SAMPLING_REQUEST: 'mcp:sampling-request', - SAMPLING_DECISION: 'mcp:sampling-decision', - SAMPLING_CANCELLED: 'mcp:sampling-cancelled' + INITIALIZED: 'mcp:initialized' // 新增:MCP初始化完成事件 } // 同步相关事件 export const SYNC_EVENTS = { - BACKUP_STARTED: 'sync:backup-started', - BACKUP_COMPLETED: 'sync:backup-completed', - BACKUP_ERROR: 'sync:backup-error', - BACKUP_STATUS_CHANGED: 'sync:backup-status-changed', - IMPORT_STARTED: 'sync:import-started', - IMPORT_COMPLETED: 'sync:import-completed', - IMPORT_ERROR: 'sync:import-error', DATA_CHANGED: 'sync:data-changed' } -// 速率限制相关事件 -export const RATE_LIMIT_EVENTS = { - CONFIG_UPDATED: 'rate-limit:config-updated', - REQUEST_QUEUED: 'rate-limit:request-queued', - REQUEST_EXECUTED: 'rate-limit:request-executed', - LIMIT_EXCEEDED: 'rate-limit:limit-exceeded' -} - // DeepLink 相关事件 export const DEEPLINK_EVENTS = { PROTOCOL_RECEIVED: 'deeplink:protocol-received', @@ -178,14 +120,6 @@ export const DEEPLINK_EVENTS = { MCP_INSTALL: 'deeplink:mcp-install' } -// 全局通知相关事件 -export const NOTIFICATION_EVENTS = { - SHOW_ERROR: 'notification:show-error', // 显示错误通知 - DATABASE_REPAIR_SUGGESTED: 'notification:database-repair-suggested', - SYS_NOTIFY_CLICKED: 'notification:sys-notify-clicked', // 系统通知点击事件 - DATA_RESET_COMPLETE_DEV: 'notification:data-reset-complete-dev' // 开发环境数据重置完成通知 -} - export const SHORTCUT_EVENTS = { ZOOM_IN: 'shortcut:zoom-in', ZOOM_OUT: 'shortcut:zoom-out', @@ -202,7 +136,6 @@ export const SHORTCUT_EVENTS = { // 标签页相关事件 export const TAB_EVENTS = { - TITLE_UPDATED: 'tab:title-updated', // 标签页标题更新 
CONTENT_UPDATED: 'tab:content-updated', // 标签页内容更新 STATE_CHANGED: 'tab:state-changed', // 标签页状态变化 VISIBILITY_CHANGED: 'tab:visibility-changed', // 标签页可见性变化 @@ -211,58 +144,12 @@ export const TAB_EVENTS = { CLOSED: 'tab:closed' // 标签页被关闭事件 } -// Yo Browser 相关事件 -export const YO_BROWSER_EVENTS = { - OPEN_REQUESTED: 'yo-browser:open-requested', - WINDOW_CREATED: 'yo-browser:window-created', - WINDOW_UPDATED: 'yo-browser:window-updated', - WINDOW_CLOSED: 'yo-browser:window-closed', - WINDOW_FOCUSED: 'yo-browser:window-focused', - WINDOW_COUNT_CHANGED: 'yo-browser:window-count-changed', - WINDOW_VISIBILITY_CHANGED: 'yo-browser:window-visibility-changed' -} - // 托盘相关事件 export const TRAY_EVENTS = { SHOW_HIDDEN_WINDOW: 'tray:show-hidden-window', // 从托盘显示/隐藏窗口 CHECK_FOR_UPDATES: 'tray:check-for-updates' // 托盘检查更新 } -// 悬浮按钮相关事件 -export const FLOATING_BUTTON_EVENTS = { - CLICKED: 'floating-button:clicked', // 悬浮按钮被点击 - RIGHT_CLICKED: 'floating-button:right-clicked', // 悬浮按钮被右键点击 - VISIBILITY_CHANGED: 'floating-button:visibility-changed', // 悬浮按钮显示状态改变 - POSITION_CHANGED: 'floating-button:position-changed', // 悬浮按钮位置改变 - ENABLED_CHANGED: 'floating-button:enabled-changed', // 悬浮按钮启用状态改变 - HOVER_STATE_CHANGED: 'floating-button:hover-state-changed', - SNAPSHOT_REQUEST: 'floating-button:snapshot-request', - SNAPSHOT_UPDATED: 'floating-button:snapshot-updated', - LANGUAGE_REQUEST: 'floating-button:language-request', - LANGUAGE_CHANGED: 'floating-button:language-changed', - THEME_REQUEST: 'floating-button:theme-request', - THEME_CHANGED: 'floating-button:theme-changed', - ACP_REGISTRY_ICON_REQUEST: 'floating-button:acp-registry-icon-request', - TOGGLE_EXPANDED: 'floating-button:toggle-expanded', - SET_EXPANDED: 'floating-button:set-expanded', - OPEN_SESSION: 'floating-button:open-session', - DRAG_START: 'floating-button:drag-start', // 悬浮按钮开始拖拽 - DRAG_MOVE: 'floating-button:drag-move', // 悬浮按钮拖拽移动 - DRAG_END: 'floating-button:drag-end' // 悬浮按钮结束拖拽 -} - -// Dialog related events 
-export const DIALOG_EVENTS = { - REQUEST: 'dialog:request', // Main -> Renderer: Request to show dialog - RESPONSE: 'dialog:response' // Renderer -> Main: Dialog result response -} - -// Knowledge base events -export const RAG_EVENTS = { - FILE_UPDATED: 'rag:file-updated', // File status update - FILE_PROGRESS: 'rag:file-progress' // File processing progress update -} - // Lifecycle management events export const LIFECYCLE_EVENTS = { PHASE_STARTED: 'lifecycle:phase-started', // Lifecycle phase started @@ -274,43 +161,3 @@ export const LIFECYCLE_EVENTS = { PROGRESS_UPDATED: 'lifecycle:progress-updated', // Lifecycle progress updated SHUTDOWN_REQUESTED: 'lifecycle:shutdown-requested' // Application shutdown requested } - -// Workspace events -export const WORKSPACE_EVENTS = { - INVALIDATED: 'workspace:files-changed', // Workspace invalidation event - FILES_CHANGED: 'workspace:files-changed' // Legacy alias -} - -// ACP-specific workspace events -export const ACP_WORKSPACE_EVENTS = { - SESSION_MODES_READY: 'acp-workspace:session-modes-ready', // Session modes available - SESSION_COMMANDS_READY: 'acp-workspace:session-commands-ready', // Session commands available - SESSION_CONFIG_OPTIONS_READY: 'acp-workspace:session-config-options-ready' // Session config options available -} - -export const ACP_DEBUG_EVENTS = { - EVENT: 'acp-debug:event' -} - -// Skills system events -export const SKILL_EVENTS = { - DISCOVERED: 'skill:discovered', // Skills discovery completed - METADATA_UPDATED: 'skill:metadata-updated', // Metadata hot-reload updated - INSTALLED: 'skill:installed', // Skill installation completed - UNINSTALLED: 'skill:uninstalled', // Skill uninstallation completed - ACTIVATED: 'skill:activated', // Skill activated in session - DEACTIVATED: 'skill:deactivated' // Skill deactivated in session -} - -// Skill sync events (cross-tool synchronization) -export const SKILL_SYNC_EVENTS = { - SCAN_STARTED: 'skill-sync:scan-started', // Scan operation started - 
SCAN_COMPLETED: 'skill-sync:scan-completed', // Scan operation completed - NEW_DISCOVERIES: 'skill-sync:new-discoveries', // New skills discovered (after comparing with cache) - IMPORT_STARTED: 'skill-sync:import-started', // Import operation started - IMPORT_PROGRESS: 'skill-sync:import-progress', // Import progress update - IMPORT_COMPLETED: 'skill-sync:import-completed', // Import operation completed - EXPORT_STARTED: 'skill-sync:export-started', // Export operation started - EXPORT_PROGRESS: 'skill-sync:export-progress', // Export progress update - EXPORT_COMPLETED: 'skill-sync:export-completed' // Export operation completed -} diff --git a/src/main/presenter/agentRuntimePresenter/dispatch.ts b/src/main/presenter/agentRuntimePresenter/dispatch.ts index 6a4ab6398..3eaa7417d 100644 --- a/src/main/presenter/agentRuntimePresenter/dispatch.ts +++ b/src/main/presenter/agentRuntimePresenter/dispatch.ts @@ -1,5 +1,3 @@ -import { eventBus, SendTarget } from '@/eventbus' -import { STREAM_EVENTS } from '@/events' import type { MCPToolCall, MCPContentItem, @@ -870,12 +868,6 @@ function appendSkillDraftQuestionActionBlock( function flushBlocksToRenderer(io: IoParams, blocks: AssistantMessageBlock[]): void { const renderedBlocks = cloneBlocksForRenderer(blocks) - eventBus.sendToRenderer(STREAM_EVENTS.RESPONSE, SendTarget.ALL_WINDOWS, { - conversationId: io.sessionId, - eventId: io.messageId, - messageId: io.messageId, - blocks: renderedBlocks - }) publishDeepchatEvent('chat.stream.updated', { kind: 'snapshot', requestId: io.requestId, @@ -1456,10 +1448,11 @@ export function finalizePaused(state: StreamState, io: IoParams): void { io.messageStore.updateAssistantContent(io.messageId, state.blocks) flushBlocksToRenderer(io, state.blocks) - eventBus.sendToRenderer(STREAM_EVENTS.END, SendTarget.ALL_WINDOWS, { - conversationId: io.sessionId, - eventId: io.messageId, - messageId: io.messageId + publishDeepchatEvent('chat.stream.completed', { + requestId: io.requestId, + sessionId: 
io.sessionId, + messageId: io.messageId, + completedAt: Date.now() }) } @@ -1485,11 +1478,6 @@ export function finalize(state: StreamState, io: IoParams): void { JSON.stringify(state.metadata) ) flushBlocksToRenderer(io, state.blocks) - eventBus.sendToRenderer(STREAM_EVENTS.END, SendTarget.ALL_WINDOWS, { - conversationId: io.sessionId, - eventId: io.messageId, - messageId: io.messageId - }) publishDeepchatEvent('chat.stream.completed', { requestId: io.requestId, sessionId: io.sessionId, @@ -1515,12 +1503,6 @@ export function finalizeError(state: StreamState, io: IoParams, error: unknown): io.messageStore.setMessageError(io.messageId, state.blocks, JSON.stringify(state.metadata)) flushBlocksToRenderer(io, state.blocks) - eventBus.sendToRenderer(STREAM_EVENTS.ERROR, SendTarget.ALL_WINDOWS, { - conversationId: io.sessionId, - eventId: io.messageId, - messageId: io.messageId, - error: errorMessage - }) publishDeepchatEvent('chat.stream.failed', { requestId: io.requestId, sessionId: io.sessionId, diff --git a/src/main/presenter/agentRuntimePresenter/echo.ts b/src/main/presenter/agentRuntimePresenter/echo.ts index 78aecfabd..f5f849605 100644 --- a/src/main/presenter/agentRuntimePresenter/echo.ts +++ b/src/main/presenter/agentRuntimePresenter/echo.ts @@ -3,8 +3,6 @@ import { AssistantMessageBlockSchema } from '@shared/contracts/common' import type { AssistantMessageBlock } from '@shared/types/agent-interface' import type { StreamState, IoParams } from './types' import { createThrottle } from '@shared/utils/throttle' -import { eventBus, SendTarget } from '@/eventbus' -import { STREAM_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' const RENDERER_FLUSH_INTERVAL = 120 @@ -27,12 +25,6 @@ export function cloneBlocksForRenderer( export function startEcho(state: StreamState, io: IoParams): EchoHandle { function flushToRenderer(): void { const renderedBlocks = cloneBlocksForRenderer(state.blocks) - 
eventBus.sendToRenderer(STREAM_EVENTS.RESPONSE, SendTarget.ALL_WINDOWS, { - conversationId: io.sessionId, - eventId: io.messageId, - messageId: io.messageId, - blocks: renderedBlocks - }) publishDeepchatEvent('chat.stream.updated', { kind: 'snapshot', requestId: io.requestId, diff --git a/src/main/presenter/agentRuntimePresenter/index.ts b/src/main/presenter/agentRuntimePresenter/index.ts index eb540d1bb..d5ebbcba4 100644 --- a/src/main/presenter/agentRuntimePresenter/index.ts +++ b/src/main/presenter/agentRuntimePresenter/index.ts @@ -74,8 +74,8 @@ import { import { nanoid } from 'nanoid' import type { SQLitePresenter } from '../sqlitePresenter' import type { DeepChatTapeEntryRow } from '../sqlitePresenter/tables/deepchatTapeEntries' -import { eventBus, SendTarget } from '@/eventbus' -import { MCP_EVENTS, SESSION_EVENTS, STREAM_EVENTS } from '@/events' +import { eventBus } from '@/eventbus' +import { MCP_EVENTS } from '@/events' import { buildRuntimeCapabilitiesPrompt, buildSystemEnvPrompt @@ -1257,12 +1257,6 @@ export class AgentRuntimePresenter implements IAgentImplementation { this.updateToolCallResponse(blocks, toolCall.id, execution.terminalError, true) this.messageStore.setMessageError(messageId, blocks) this.emitMessageRefresh(sessionId, messageId) - eventBus.sendToRenderer(STREAM_EVENTS.ERROR, SendTarget.ALL_WINDOWS, { - conversationId: sessionId, - eventId: messageId, - messageId, - error: execution.terminalError - }) publishDeepchatEvent('chat.stream.failed', { requestId: this.resolveStreamRequestId(sessionId, messageId), sessionId, @@ -2888,12 +2882,6 @@ export class AgentRuntimePresenter implements IAgentImplementation { } const renderedBlocks = cloneBlocksForRenderer([block]) - eventBus.sendToRenderer(STREAM_EVENTS.RESPONSE, SendTarget.ALL_WINDOWS, { - conversationId: sessionId, - eventId: messageId, - messageId, - blocks: renderedBlocks - }) publishDeepchatEvent('chat.stream.updated', { kind: 'snapshot', requestId, @@ -2909,12 +2897,6 @@ export class 
AgentRuntimePresenter implements IAgentImplementation { messageId: string, requestId: string ): void { - eventBus.sendToRenderer(STREAM_EVENTS.RESPONSE, SendTarget.ALL_WINDOWS, { - conversationId: sessionId, - eventId: messageId, - messageId, - blocks: [] - }) publishDeepchatEvent('chat.stream.updated', { kind: 'snapshot', requestId, @@ -3093,12 +3075,6 @@ export class AgentRuntimePresenter implements IAgentImplementation { this.updateToolCallResponse(initialBlocks, budgetToolCall.id, resumeBudget.message, true) this.messageStore.setMessageError(messageId, initialBlocks) this.emitMessageRefresh(sessionId, messageId) - eventBus.sendToRenderer(STREAM_EVENTS.ERROR, SendTarget.ALL_WINDOWS, { - conversationId: sessionId, - eventId: messageId, - messageId, - error: resumeBudget.message - }) publishDeepchatEvent('chat.stream.failed', { requestId: this.resolveStreamRequestId(sessionId, messageId), sessionId, @@ -5562,11 +5538,12 @@ export class AgentRuntimePresenter implements IAgentImplementation { private emitCompactionState(sessionId: string, state: SessionCompactionState): void { this.sessionCompactionStates.set(sessionId, { ...state }) - eventBus.sendToRenderer(SESSION_EVENTS.COMPACTION_UPDATED, SendTarget.ALL_WINDOWS, { + publishDeepchatEvent('sessions.compaction.changed', { sessionId, status: state.status, cursorOrderSeq: state.cursorOrderSeq, - summaryUpdatedAt: state.summaryUpdatedAt + summaryUpdatedAt: state.summaryUpdatedAt, + version: Date.now() }) } @@ -5591,10 +5568,6 @@ export class AgentRuntimePresenter implements IAgentImplementation { return } current.status = status - eventBus.sendToRenderer(SESSION_EVENTS.STATUS_CHANGED, SendTarget.ALL_WINDOWS, { - sessionId, - status - }) publishDeepchatEvent('sessions.status.changed', { sessionId, status, @@ -5615,10 +5588,11 @@ export class AgentRuntimePresenter implements IAgentImplementation { } private emitMessageRefresh(sessionId: string, messageId: string): void { - eventBus.sendToRenderer(STREAM_EVENTS.END, 
SendTarget.ALL_WINDOWS, { - conversationId: sessionId, - eventId: messageId, - messageId + publishDeepchatEvent('chat.stream.completed', { + requestId: this.resolveStreamRequestId(sessionId, messageId), + sessionId, + messageId, + completedAt: Date.now() }) const message = this.messageStore.getMessage(messageId) diff --git a/src/main/presenter/agentRuntimePresenter/pendingInputCoordinator.ts b/src/main/presenter/agentRuntimePresenter/pendingInputCoordinator.ts index 21f7ce902..35dd54b68 100644 --- a/src/main/presenter/agentRuntimePresenter/pendingInputCoordinator.ts +++ b/src/main/presenter/agentRuntimePresenter/pendingInputCoordinator.ts @@ -1,5 +1,3 @@ -import { eventBus, SendTarget } from '@/eventbus' -import { SESSION_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import type { PendingSessionInputRecord, @@ -222,9 +220,6 @@ export class PendingInputCoordinator { } private emitUpdated(sessionId: string): void { - eventBus.sendToRenderer(SESSION_EVENTS.PENDING_INPUTS_UPDATED, SendTarget.ALL_WINDOWS, { - sessionId - }) publishDeepchatEvent('sessions.pendingInputs.changed', { sessionId, version: Date.now() diff --git a/src/main/presenter/agentSessionPresenter/index.ts b/src/main/presenter/agentSessionPresenter/index.ts index dff1c3875..8d6ad3a99 100644 --- a/src/main/presenter/agentSessionPresenter/index.ts +++ b/src/main/presenter/agentSessionPresenter/index.ts @@ -56,8 +56,6 @@ import { AgentRegistry } from './agentRegistry' import { NewSessionManager } from './sessionManager' import { NewMessageManager } from './messageManager' import { LegacyChatImportService } from './legacyImportService' -import { eventBus, SendTarget } from '@/eventbus' -import { SESSION_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import { buildConversationExportContent, @@ -295,17 +293,6 @@ export class AgentSessionPresenter { { id: 'deepchat', name: 'DeepChat', type: 'deepchat', enabled: true 
}, agentRuntimeAgent ) - - eventBus.on( - SESSION_EVENTS.STATUS_CHANGED, - (payload: { sessionId?: string; status?: SessionWithState['status'] }) => { - if (!payload?.sessionId || !payload?.status) { - return - } - - this.sessionStatusSnapshots.set(payload.sessionId, payload.status) - } - ) } // ---- IPC-facing methods ---- @@ -406,10 +393,6 @@ export class AgentSessionPresenter { // Bind to window and emit activated this.sessionManager.bindWindow(webContentsId, sessionId) - eventBus.sendToRenderer(SESSION_EVENTS.ACTIVATED, SendTarget.ALL_WINDOWS, { - webContentsId, - sessionId - }) this.emitSessionListUpdated({ sessionIds: [sessionId], reason: 'created', @@ -1764,10 +1747,6 @@ export class AgentSessionPresenter { async activateSession(webContentsId: number, sessionId: string): Promise { this.sessionManager.bindWindow(webContentsId, sessionId) - eventBus.sendToRenderer(SESSION_EVENTS.ACTIVATED, SendTarget.ALL_WINDOWS, { - webContentsId, - sessionId - }) publishDeepchatEvent('sessions.updated', { sessionIds: [sessionId], reason: 'activated', @@ -1778,9 +1757,6 @@ export class AgentSessionPresenter { async deactivateSession(webContentsId: number): Promise { this.sessionManager.unbindWindow(webContentsId) - eventBus.sendToRenderer(SESSION_EVENTS.DEACTIVATED, SendTarget.ALL_WINDOWS, { - webContentsId - }) publishDeepchatEvent('sessions.updated', { sessionIds: [], reason: 'deactivated', @@ -2457,7 +2433,6 @@ export class AgentSessionPresenter { ) const reason = options.reason ?? (sessionIds.length > 0 ? 
'updated' : 'list-refreshed') - eventBus.sendToRenderer(SESSION_EVENTS.LIST_UPDATED, SendTarget.ALL_WINDOWS) publishDeepchatEvent('sessions.updated', { sessionIds, reason, diff --git a/src/main/presenter/browser/YoBrowserPresenter.ts b/src/main/presenter/browser/YoBrowserPresenter.ts index d139786f7..7502124a2 100644 --- a/src/main/presenter/browser/YoBrowserPresenter.ts +++ b/src/main/presenter/browser/YoBrowserPresenter.ts @@ -2,8 +2,6 @@ import { BrowserWindow, WebContents, WebContentsView } from 'electron' import type { Rectangle } from 'electron' import { is } from '@electron-toolkit/utils' import { nanoid } from 'nanoid' -import { eventBus, SendTarget } from '@/eventbus' -import { YO_BROWSER_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import logger from '@shared/logger' import { @@ -231,7 +229,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { } this.emitWindowClosed(sessionId) - this.emitWindowCount() } async goBack(sessionId: string): Promise { @@ -385,7 +382,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { this.sessionBrowsers.set(sessionId, state) this.setupPageListeners(state, view.webContents) this.emitWindowCreated(sessionId) - this.emitWindowCount() return state } @@ -491,7 +487,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { state.visible = false this.sessionBrowsers.delete(sessionId) this.emitWindowClosed(sessionId) - this.emitWindowCount() } private attachHostWindowListeners(windowId: number): void { @@ -722,7 +717,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { status: this.toStatus(this.sessionBrowsers.get(sessionId) ?? 
null) } - eventBus.sendToRenderer(YO_BROWSER_EVENTS.WINDOW_CREATED, SendTarget.ALL_WINDOWS, payload) publishDeepchatEvent('browser.status.changed', { sessionId, reason: 'created', @@ -741,7 +735,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { url } - eventBus.sendToRenderer(YO_BROWSER_EVENTS.OPEN_REQUESTED, SendTarget.ALL_WINDOWS, payload) publishDeepchatEvent('browser.open.requested', { ...payload, version: Date.now() @@ -750,10 +743,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { private emitWindowUpdated(sessionId: string): void { const status = this.toStatus(this.sessionBrowsers.get(sessionId) ?? null) - eventBus.sendToRenderer(YO_BROWSER_EVENTS.WINDOW_UPDATED, SendTarget.ALL_WINDOWS, { - sessionId, - status - }) publishDeepchatEvent('browser.status.changed', { sessionId, reason: 'updated', @@ -764,9 +753,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { } private emitWindowClosed(sessionId: string): void { - eventBus.sendToRenderer(YO_BROWSER_EVENTS.WINDOW_CLOSED, SendTarget.ALL_WINDOWS, { - sessionId - }) publishDeepchatEvent('browser.status.changed', { sessionId, reason: 'closed', @@ -777,10 +763,6 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { } private emitWindowFocused(sessionId: string, windowId: number): void { - eventBus.sendToRenderer(YO_BROWSER_EVENTS.WINDOW_FOCUSED, SendTarget.ALL_WINDOWS, { - sessionId, - windowId - }) publishDeepchatEvent('browser.status.changed', { sessionId, reason: 'focused', @@ -790,19 +772,7 @@ export class YoBrowserPresenter implements IYoBrowserPresenter { }) } - private emitWindowCount(): void { - eventBus.sendToRenderer( - YO_BROWSER_EVENTS.WINDOW_COUNT_CHANGED, - SendTarget.ALL_WINDOWS, - this.sessionBrowsers.size - ) - } - private emitWindowVisibility(sessionId: string, visible: boolean): void { - eventBus.sendToRenderer(YO_BROWSER_EVENTS.WINDOW_VISIBILITY_CHANGED, SendTarget.ALL_WINDOWS, { - sessionId, - visible - }) 
publishDeepchatEvent('browser.status.changed', { sessionId, reason: 'visibility', diff --git a/src/main/presenter/configPresenter/acpInitHelper.ts b/src/main/presenter/configPresenter/acpInitHelper.ts index 79c92273d..5659513e5 100644 --- a/src/main/presenter/configPresenter/acpInitHelper.ts +++ b/src/main/presenter/configPresenter/acpInitHelper.ts @@ -14,6 +14,8 @@ import { mergeCommandEnvironment, setPathEntriesOnEnv } from '@/lib/agentRuntime/shellEnvHelper' +import { DEEPCHAT_EVENT_CHANNEL } from '@shared/contracts/channels' +import { createDeepchatEventEnvelope } from '@/routes/publishDeepchatEvent' const execAsync = promisify(exec) @@ -229,10 +231,14 @@ class AcpInitHelper { missingCount: missingDeps.length }) if (webContents && !webContents.isDestroyed()) { - webContents.send('external-deps-required', { - agentId, - missingDeps - }) + webContents.send( + DEEPCHAT_EVENT_CHANNEL, + createDeepchatEventEnvelope('acpTerminal.externalDependenciesRequired', { + agentId, + missingDeps, + version: Date.now() + }) + ) } // Stop initialization - user must install dependencies first return null @@ -425,7 +431,14 @@ class AcpInitHelper { // Send output to renderer (PTY output is treated as stdout) if (!webContents.isDestroyed()) { - webContents.send('acp-init:output', { type: 'stdout', data }) + webContents.send( + DEEPCHAT_EVENT_CHANNEL, + createDeepchatEventEnvelope('acpTerminal.output', { + type: 'stdout', + data, + version: Date.now() + }) + ) } // Inject command once shell is ready @@ -460,7 +473,14 @@ class AcpInitHelper { commandInjected }) if (!webContents.isDestroyed()) { - webContents.send('acp-init:exit', { code: exitCode, signal: signal || null }) + webContents.send( + DEEPCHAT_EVENT_CHANNEL, + createDeepchatEventEnvelope('acpTerminal.exited', { + code: exitCode, + signal: signal || null, + version: Date.now() + }) + ) } if (this.activeShell === pty) { this.activeShell = null @@ -473,7 +493,13 @@ class AcpInitHelper { setTimeout(() => { if 
(!webContents.isDestroyed()) { logger.info('[ACP Init] Sending start event (delayed to ensure listeners ready)') - webContents.send('acp-init:start', { command: shell }) + webContents.send( + DEEPCHAT_EVENT_CHANNEL, + createDeepchatEventEnvelope('acpTerminal.started', { + command: shell, + version: Date.now() + }) + ) } // Fallback: inject command if shell hasn't become ready yet diff --git a/src/main/presenter/configPresenter/eventPublishers.ts b/src/main/presenter/configPresenter/eventPublishers.ts new file mode 100644 index 000000000..de81473cb --- /dev/null +++ b/src/main/presenter/configPresenter/eventPublishers.ts @@ -0,0 +1,200 @@ +import { eventBus } from '@/eventbus' +import { CONFIG_EVENTS, FLOATING_BUTTON_EVENTS, SYSTEM_EVENTS } from '@/events' +import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' +import { + readAcpState, + readLanguageState, + readSyncSettings, + readThemeState +} from '@/routes/config/configRouteSupport' +import type { IConfigPresenter } from '@shared/presenter' +import type { ProviderBatchUpdate, ProviderChange } from '@shared/provider-operations' + +export function emitLanguageChanged(configPresenter: IConfigPresenter, language: string): void { + eventBus.sendToMain(CONFIG_EVENTS.LANGUAGE_CHANGED, language) + publishDeepchatEvent('config.language.changed', { + ...readLanguageState(configPresenter), + version: Date.now() + }) +} + +export function emitThemeChanged( + configPresenter: IConfigPresenter, + theme: 'dark' | 'light' | 'system' +): void { + eventBus.sendToMain(CONFIG_EVENTS.THEME_CHANGED, theme) + void readThemeState(configPresenter) + .then((state) => { + publishDeepchatEvent('config.theme.changed', { + ...state, + version: Date.now() + }) + }) + .catch((error) => { + console.error('Failed to publish typed theme changed event:', error) + }) +} + +export function emitSystemThemeChanged(isDark: boolean): void { + eventBus.sendToMain(SYSTEM_EVENTS.SYSTEM_THEME_UPDATED, isDark) + 
publishDeepchatEvent('config.systemTheme.changed', { + isDark, + version: Date.now() + }) +} + +export function emitFloatingButtonChanged(enabled: boolean): void { + eventBus.sendToMain(FLOATING_BUTTON_EVENTS.ENABLED_CHANGED, enabled) + publishDeepchatEvent('config.floatingButton.changed', { + enabled, + version: Date.now() + }) +} + +export function emitSyncSettingsChanged( + configPresenter: IConfigPresenter, + change: { enabled?: boolean; folderPath?: string } +): void { + eventBus.sendToMain(CONFIG_EVENTS.SYNC_SETTINGS_CHANGED, change) + publishDeepchatEvent('config.syncSettings.changed', { + ...readSyncSettings(configPresenter), + version: Date.now() + }) +} + +export function emitDefaultProjectPathChanged(path: string | null): void { + eventBus.sendToMain(CONFIG_EVENTS.DEFAULT_PROJECT_PATH_CHANGED, { path }) + publishDeepchatEvent('config.defaultProjectPath.changed', { + path, + version: Date.now() + }) +} + +export function emitAcpAgentsChanged(configPresenter: IConfigPresenter, agentIds?: string[]): void { + eventBus.sendToMain(CONFIG_EVENTS.AGENTS_CHANGED, { agentIds }) + void readAcpState(configPresenter) + .then((state) => { + publishDeepchatEvent('config.agents.changed', { + ...state, + agentIds, + version: Date.now() + }) + }) + .catch((error) => { + console.error('Failed to publish typed ACP agents changed event:', error) + }) + publishDeepchatEvent('models.changed', { + reason: 'agents', + providerId: 'acp', + version: Date.now() + }) +} + +export async function emitCustomPromptsChanged(configPresenter: IConfigPresenter): Promise { + eventBus.sendToMain(CONFIG_EVENTS.CUSTOM_PROMPTS_CHANGED) + publishDeepchatEvent('config.customPrompts.changed', { + prompts: await configPresenter.getCustomPrompts(), + version: Date.now() + }) +} + +export function emitProvidersChanged(): void { + eventBus.sendToMain(CONFIG_EVENTS.PROVIDER_CHANGED) + publishDeepchatEvent('providers.changed', { + reason: 'providers', + version: Date.now() + }) +} + +export function 
emitProviderAtomicUpdate(change: ProviderChange): void { + eventBus.sendToMain(CONFIG_EVENTS.PROVIDER_ATOMIC_UPDATE, change) + publishDeepchatEvent('providers.changed', { + reason: 'provider-atomic-update', + providerIds: change.providerId ? [change.providerId] : undefined, + version: Date.now() + }) +} + +export function emitProviderBatchUpdate(batchUpdate: ProviderBatchUpdate): void { + eventBus.sendToMain(CONFIG_EVENTS.PROVIDER_BATCH_UPDATE, batchUpdate) + publishDeepchatEvent('providers.changed', { + reason: 'provider-batch-update', + providerIds: Array.isArray(batchUpdate.providers) + ? batchUpdate.providers.map((provider) => provider.id) + : undefined, + version: Date.now() + }) +} + +export function emitModelsChanged(providerId?: string): void { + eventBus.sendToMain(CONFIG_EVENTS.MODEL_LIST_CHANGED, providerId) + publishDeepchatEvent('models.changed', { + reason: 'runtime-refresh', + providerId, + version: Date.now() + }) +} + +export function emitModelStatusChanged(payload: { + providerId: string + modelId: string + enabled: boolean +}): void { + eventBus.sendToMain(CONFIG_EVENTS.MODEL_STATUS_CHANGED, payload) + publishDeepchatEvent('models.status.changed', { + ...payload, + version: Date.now() + }) +} + +export function emitModelBatchStatusChanged(payload: { + providerId: string + updates: { modelId: string; enabled: boolean }[] +}): void { + eventBus.sendToMain(CONFIG_EVENTS.MODEL_BATCH_STATUS_CHANGED, payload) + publishDeepchatEvent('models.batch.status.changed', { + ...payload, + version: Date.now() + }) +} + +export function emitModelConfigChanged( + providerId: string, + modelId: string, + config: Record +): void { + eventBus.sendToMain(CONFIG_EVENTS.MODEL_CONFIG_CHANGED, providerId, modelId, config) + publishDeepchatEvent('models.config.changed', { + changeType: 'updated', + providerId, + modelId, + config, + version: Date.now() + }) +} + +export function emitModelConfigReset(providerId: string, modelId: string): void { + 
eventBus.sendToMain(CONFIG_EVENTS.MODEL_CONFIG_RESET, providerId, modelId) + publishDeepchatEvent('models.config.changed', { + changeType: 'reset', + providerId, + modelId, + version: Date.now() + }) +} + +export function emitModelConfigsImported(overwrite: boolean): void { + eventBus.sendToMain(CONFIG_EVENTS.MODEL_CONFIGS_IMPORTED, overwrite) + publishDeepchatEvent('models.config.changed', { + changeType: 'imported', + overwrite, + version: Date.now() + }) +} + +export function emitDefaultSystemPromptChanged(payload: { + promptId: string + content: string +}): void { + eventBus.sendToMain(CONFIG_EVENTS.DEFAULT_SYSTEM_PROMPT_CHANGED, payload) +} diff --git a/src/main/presenter/configPresenter/index.ts b/src/main/presenter/configPresenter/index.ts index 5f75e9f7c..8087fb39a 100644 --- a/src/main/presenter/configPresenter/index.ts +++ b/src/main/presenter/configPresenter/index.ts @@ -1,5 +1,5 @@ import logger from '@shared/logger' -import { eventBus, SendTarget } from '@/eventbus' +import { eventBus } from '@/eventbus' import { IConfigPresenter, LLM_PROVIDER, @@ -46,13 +46,7 @@ import { DEFAULT_PROVIDERS } from './providers' import path from 'path' import { app, nativeTheme, shell, safeStorage } from 'electron' import fs from 'fs' -import { - CONFIG_EVENTS, - SYSTEM_EVENTS, - FLOATING_BUTTON_EVENTS, - SESSION_EVENTS, - MCP_EVENTS -} from '@/events' +import { CONFIG_EVENTS, MCP_EVENTS } from '@/events' import { McpConfHelper } from './mcpConfHelper' import { presenter } from '@/presenter' import { compare } from 'compare-versions' @@ -83,6 +77,21 @@ import { normalizeDeepChatSubagentConfig } from '@shared/lib/deepchatSubagents' import type { SQLitePresenter } from '../sqlitePresenter' import type { SettingsKey, SettingsSnapshotValues } from '@shared/contracts/routes' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' +import { + emitAcpAgentsChanged, + emitCustomPromptsChanged, + emitDefaultProjectPathChanged, + emitDefaultSystemPromptChanged, + 
emitFloatingButtonChanged, + emitLanguageChanged, + emitModelConfigChanged, + emitModelConfigReset, + emitModelConfigsImported, + emitModelsChanged, + emitSyncSettingsChanged, + emitSystemThemeChanged, + emitThemeChanged +} from './eventPublishers' import type { HookTestResult, HooksNotificationsSettings } from '@shared/hooksNotifications' import type { Agent, @@ -1462,11 +1471,6 @@ export class ConfigPresenter implements IConfigPresenter { // Trigger setting change event (main process internal use only) eventBus.sendToMain(CONFIG_EVENTS.SETTING_CHANGED, key, value) - // Special handling: font size settings need to notify all tabs - if (key === 'fontSizeLevel') { - eventBus.sendToRenderer(CONFIG_EVENTS.FONT_SIZE_CHANGED, SendTarget.ALL_WINDOWS, value) - } - const trackedChange = toTrackedSettingsChangePayload(key, value) if (trackedChange) { publishDeepchatEvent('settings.changed', { @@ -1750,8 +1754,7 @@ export class ConfigPresenter implements IConfigPresenter { // Set application language setLanguage(language: string): void { this.setSetting('language', language) - // Trigger language change event (need to notify all tabs) - eventBus.send(CONFIG_EVENTS.LANGUAGE_CHANGED, SendTarget.ALL_WINDOWS, language) + emitLanguageChanged(this, language) try { presenter.floatingButtonPresenter.refreshLanguage() @@ -1855,7 +1858,7 @@ export class ConfigPresenter implements IConfigPresenter { setSyncEnabled(enabled: boolean): void { logger.info('setSyncEnabled', enabled) this.setSetting('syncEnabled', enabled) - eventBus.send(CONFIG_EVENTS.SYNC_SETTINGS_CHANGED, SendTarget.ALL_WINDOWS, { enabled }) + emitSyncSettingsChanged(this, { enabled }) } // Get sync folder path @@ -1868,7 +1871,7 @@ export class ConfigPresenter implements IConfigPresenter { // Set sync folder path setSyncFolderPath(folderPath: string): void { this.setSetting('syncFolderPath', folderPath) - eventBus.send(CONFIG_EVENTS.SYNC_SETTINGS_CHANGED, SendTarget.ALL_WINDOWS, { folderPath }) + 
emitSyncSettingsChanged(this, { folderPath }) } // Get last sync time @@ -2073,8 +2076,7 @@ export class ConfigPresenter implements IConfigPresenter { async setCustomSearchEngines(engines: SearchEngineTemplate[]): Promise { try { this.store.set('customSearchEngines', JSON.stringify(engines)) - // Send event to notify search engine update (need to notify all tabs) - eventBus.send(CONFIG_EVENTS.SEARCH_ENGINES_UPDATED, SendTarget.ALL_WINDOWS, engines) + eventBus.sendToMain(CONFIG_EVENTS.SEARCH_ENGINES_UPDATED, engines) } catch (error) { console.error('Failed to set custom search engines:', error) throw error @@ -2255,7 +2257,7 @@ export class ConfigPresenter implements IConfigPresenter { // Set floating button switch status setFloatingButtonEnabled(enabled: boolean): void { this.setSetting('floatingButtonEnabled', enabled) - eventBus.send(FLOATING_BUTTON_EVENTS.ENABLED_CHANGED, SendTarget.ALL_WINDOWS, enabled) + emitFloatingButtonChanged(enabled) try { presenter.floatingButtonPresenter.setEnabled(enabled) @@ -2775,9 +2777,12 @@ export class ConfigPresenter implements IConfigPresenter { private notifyAcpAgentsChanged(agentIds?: string[]) { logger.info('[ACP] notifyAcpAgentsChanged: sending MODEL_LIST_CHANGED event for provider "acp"') - eventBus.send(CONFIG_EVENTS.MODEL_LIST_CHANGED, SendTarget.ALL_WINDOWS, 'acp') - eventBus.send(CONFIG_EVENTS.AGENTS_CHANGED, SendTarget.ALL_WINDOWS, { agentIds }) - eventBus.sendToRendererIfAvailable(SESSION_EVENTS.LIST_UPDATED, SendTarget.ALL_WINDOWS) + emitModelsChanged('acp') + emitAcpAgentsChanged(this, agentIds) + publishDeepchatEvent('sessions.updated', { + sessionIds: [], + reason: 'list-refreshed' + }) } // Provide getMcpConfHelper method to get MCP configuration helper @@ -2809,14 +2814,7 @@ export class ConfigPresenter implements IConfigPresenter { ): void { const storedConfig = this.modelConfigHelper.setModelConfig(modelId, providerId, config, options) this.providerModelHelper.invalidateProviderModelsCache(providerId) - // 
Trigger model configuration change event (need to notify all tabs) - eventBus.send( - CONFIG_EVENTS.MODEL_CONFIG_CHANGED, - SendTarget.ALL_WINDOWS, - providerId, - modelId, - storedConfig - ) + emitModelConfigChanged(providerId, modelId, storedConfig as unknown as Record) } /** @@ -2827,8 +2825,7 @@ export class ConfigPresenter implements IConfigPresenter { resetModelConfig(modelId: string, providerId: string): void { this.modelConfigHelper.resetModelConfig(modelId, providerId) this.providerModelHelper.invalidateProviderModelsCache(providerId) - // 触发模型配置重置事件(需要通知所有标签页) - eventBus.send(CONFIG_EVENTS.MODEL_CONFIG_RESET, SendTarget.ALL_WINDOWS, providerId, modelId) + emitModelConfigReset(providerId, modelId) } /** @@ -2870,8 +2867,7 @@ export class ConfigPresenter implements IConfigPresenter { importModelConfigs(configs: Record, overwrite: boolean = false): void { this.modelConfigHelper.importConfigs(configs, overwrite) this.providerModelHelper.invalidateAllProviderModelsCache() - // 触发批量导入事件(需要通知所有标签页) - eventBus.send(CONFIG_EVENTS.MODEL_CONFIGS_IMPORTED, SendTarget.ALL_WINDOWS, overwrite) + emitModelConfigsImported(overwrite) } getNotificationsEnabled(): boolean { @@ -2891,7 +2887,7 @@ export class ConfigPresenter implements IConfigPresenter { nativeTheme.on('updated', () => { // 只有当主题设置为 system 时,才需要通知渲染进程系统主题变化 if (nativeTheme.themeSource === 'system') { - eventBus.sendToMain(SYSTEM_EVENTS.SYSTEM_THEME_UPDATED, nativeTheme.shouldUseDarkColors) + emitSystemThemeChanged(nativeTheme.shouldUseDarkColors) try { void presenter.floatingButtonPresenter.refreshTheme() @@ -2905,8 +2901,7 @@ export class ConfigPresenter implements IConfigPresenter { async setTheme(theme: 'dark' | 'light' | 'system'): Promise { nativeTheme.themeSource = theme this.setSetting('appTheme', theme) - // 通知所有窗口主题已更改 - eventBus.send(CONFIG_EVENTS.THEME_CHANGED, SendTarget.ALL_WINDOWS, theme) + emitThemeChanged(this, theme) try { void presenter.floatingButtonPresenter.refreshTheme() @@ -2960,10 
+2955,7 @@ export class ConfigPresenter implements IConfigPresenter { } this.clearCustomPromptsCache() logger.info(`[Config] Custom prompts cache updated: ${prompts.length} prompts`) - // Notify all windows about custom prompts change - eventBus.send(CONFIG_EVENTS.CUSTOM_PROMPTS_CHANGED, SendTarget.ALL_WINDOWS, { - count: prompts.length - }) + await emitCustomPromptsChanged(this) } // 添加单个 prompt (optimized with cache) @@ -3111,7 +3103,7 @@ export class ConfigPresenter implements IConfigPresenter { if (promptId === 'empty') { await this.setSystemPrompts(updatedPrompts) await this.clearSystemPrompt() - eventBus.send(CONFIG_EVENTS.DEFAULT_SYSTEM_PROMPT_CHANGED, SendTarget.ALL_WINDOWS, { + emitDefaultSystemPromptChanged({ promptId: 'empty', content: '' }) @@ -3124,7 +3116,7 @@ export class ConfigPresenter implements IConfigPresenter { updatedPrompts[targetIndex].isDefault = true await this.setSystemPrompts(updatedPrompts) await this.setDefaultSystemPrompt(updatedPrompts[targetIndex].content) - eventBus.send(CONFIG_EVENTS.DEFAULT_SYSTEM_PROMPT_CHANGED, SendTarget.ALL_WINDOWS, { + emitDefaultSystemPromptChanged({ promptId, content: updatedPrompts[targetIndex].content }) @@ -3201,11 +3193,20 @@ export class ConfigPresenter implements IConfigPresenter { // 设置快捷键 setShortcutKey(customShortcutKey: ShortcutKeySetting) { this.setSetting('shortcutKey', customShortcutKey) + this.publishShortcutKeysChanged() } // 重置快捷键 resetShortcutKeys() { this.setSetting('shortcutKey', { ...defaultShortcutKey }) + this.publishShortcutKeysChanged() + } + + private publishShortcutKeysChanged(): void { + publishDeepchatEvent('config.shortcutKeys.changed', { + shortcuts: this.getShortcutKey(), + version: Date.now() + }) } // 获取知识库配置 @@ -3235,10 +3236,15 @@ export class ConfigPresenter implements IConfigPresenter { } void Promise.all([this.getMcpServers(), this.getMcpEnabled()]) .then(([mcpServers, mcpEnabled]) => { - eventBus.send(MCP_EVENTS.CONFIG_CHANGED, SendTarget.ALL_WINDOWS, { + 
eventBus.sendToMain(MCP_EVENTS.CONFIG_CHANGED, { mcpServers, mcpEnabled }) + publishDeepchatEvent('mcp.config.changed', { + mcpServers, + mcpEnabled, + version: Date.now() + }) }) .catch((error) => { console.error('Failed to notify MCP config change after knowledge config update:', error) @@ -3348,11 +3354,6 @@ export class ConfigPresenter implements IConfigPresenter { }): Promise { try { this.getSettingsStoreForKey('nowledgeMemConfig').set('nowledgeMemConfig', config) - eventBus.sendToRenderer( - CONFIG_EVENTS.NOWLEDGE_MEM_CONFIG_UPDATED, - SendTarget.ALL_WINDOWS, - config - ) } catch (error) { console.error('[Config] Failed to set nowledge-mem config:', error) throw error @@ -3426,9 +3427,7 @@ export class ConfigPresenter implements IConfigPresenter { setDefaultProjectPath(projectPath: string | null): void { const normalized = projectPath?.trim() ? projectPath.trim() : null this.setSetting('defaultProjectPath', normalized) - eventBus.send(CONFIG_EVENTS.DEFAULT_PROJECT_PATH_CHANGED, SendTarget.ALL_WINDOWS, { - path: normalized - }) + emitDefaultProjectPathChanged(normalized) } } diff --git a/src/main/presenter/configPresenter/mcpConfHelper.ts b/src/main/presenter/configPresenter/mcpConfHelper.ts index dac508c24..c372fbf3e 100644 --- a/src/main/presenter/configPresenter/mcpConfHelper.ts +++ b/src/main/presenter/configPresenter/mcpConfHelper.ts @@ -1,7 +1,8 @@ import logger from '@shared/logger' -import { eventBus, SendTarget } from '@/eventbus' +import { eventBus } from '@/eventbus' import { BuiltinKnowledgeConfig, MCPServerConfig } from '@shared/presenter' import { MCP_EVENTS } from '@/events' +import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import ElectronStore from 'electron-store' // app is used in DEFAULT_INMEMORY_SERVERS but removed buildInFileSystem // import { app } from 'electron' @@ -327,9 +328,15 @@ export class McpConfHelper { } private emitConfigChanged(servers: Record): void { - eventBus.send(MCP_EVENTS.CONFIG_CHANGED, 
SendTarget.ALL_WINDOWS, { + const mcpEnabled = Boolean(this.mcpStore.get('mcpEnabled')) + eventBus.sendToMain(MCP_EVENTS.CONFIG_CHANGED, { mcpServers: servers, - mcpEnabled: this.mcpStore.get('mcpEnabled') + mcpEnabled + }) + publishDeepchatEvent('mcp.config.changed', { + mcpServers: servers, + mcpEnabled, + version: Date.now() }) } @@ -865,10 +872,18 @@ export class McpConfHelper { `MCP batch import completed. Imported: ${result.imported}, Skipped: ${result.skipped}, Errors: ${result.errors.length}` ) - // Emit event to notify about the import - eventBus.sendToRenderer(MCP_EVENTS.CONFIG_CHANGED, SendTarget.ALL_WINDOWS, { + const mcpServers = await this.getMcpServers() + const mcpEnabled = await this.getMcpEnabled() + eventBus.sendToMain(MCP_EVENTS.CONFIG_CHANGED, { action: 'batch_import', - result + result, + mcpServers, + mcpEnabled + }) + publishDeepchatEvent('mcp.config.changed', { + mcpServers, + mcpEnabled, + version: Date.now() }) return result diff --git a/src/main/presenter/configPresenter/modelStatusHelper.ts b/src/main/presenter/configPresenter/modelStatusHelper.ts index 4f0157249..261095edf 100644 --- a/src/main/presenter/configPresenter/modelStatusHelper.ts +++ b/src/main/presenter/configPresenter/modelStatusHelper.ts @@ -1,6 +1,5 @@ -import { eventBus, SendTarget } from '@/eventbus' -import { CONFIG_EVENTS } from '@/events' import type { StoreLike } from './storeLike' +import { emitModelBatchStatusChanged, emitModelStatusChanged } from './eventPublishers' type SetSetting = (key: string, value: T) => void @@ -155,7 +154,7 @@ export class ModelStatusHelper { this.setSetting(statusKey, enabled) this.cache.set(statusKey, enabled) this.statusSnapshot?.set(statusKey, enabled) - eventBus.send(CONFIG_EVENTS.MODEL_STATUS_CHANGED, SendTarget.ALL_WINDOWS, { + emitModelStatusChanged({ providerId, modelId, enabled @@ -229,7 +228,7 @@ export class ModelStatusHelper { this.statusSnapshot?.set(statusKey, enabled) } - 
eventBus.send(CONFIG_EVENTS.MODEL_BATCH_STATUS_CHANGED, SendTarget.ALL_WINDOWS, { + emitModelBatchStatusChanged({ providerId, updates }) diff --git a/src/main/presenter/configPresenter/providerDbLoader.ts b/src/main/presenter/configPresenter/providerDbLoader.ts index b781743a5..db94d7edb 100644 --- a/src/main/presenter/configPresenter/providerDbLoader.ts +++ b/src/main/presenter/configPresenter/providerDbLoader.ts @@ -8,8 +8,9 @@ import { sanitizeAggregate } from '@shared/types/model-db' import { resolveProviderId } from './providerId' -import { eventBus, SendTarget } from '@/eventbus' +import { eventBus } from '@/eventbus' import { PROVIDER_DB_EVENTS } from '@/events' +import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' const DEFAULT_PROVIDER_DB_URL = 'https://raw.githubusercontent.com/ThinkInAIXYZ/PublicProviderConf/refs/heads/dev/dist/all.json' @@ -22,6 +23,17 @@ type MetaFile = { lastAttemptedAt?: number } +function publishProviderDbCatalogChanged(reason: 'provider-db-loaded' | 'provider-db-updated') { + publishDeepchatEvent('providers.changed', { + reason, + version: Date.now() + }) + publishDeepchatEvent('models.changed', { + reason, + version: Date.now() + }) +} + export type ProviderDbRefreshResult = { status: 'updated' | 'not-modified' | 'skipped' | 'error' lastUpdated: number | null @@ -60,9 +72,10 @@ export class ProviderDbLoader { if (this.cache) { try { const providersCount = Object.keys(this.cache.providers || {}).length - eventBus.send(PROVIDER_DB_EVENTS.LOADED, SendTarget.ALL_WINDOWS, { + eventBus.sendToMain(PROVIDER_DB_EVENTS.LOADED, { providersCount }) + publishProviderDbCatalogChanged('provider-db-loaded') } catch {} } @@ -308,10 +321,11 @@ export class ProviderDbLoader { this.cache = sanitized try { const providersCount = Object.keys(this.cache.providers || {}).length - eventBus.send(PROVIDER_DB_EVENTS.UPDATED, SendTarget.ALL_WINDOWS, { + eventBus.sendToMain(PROVIDER_DB_EVENTS.UPDATED, { providersCount, lastUpdated: 
meta.lastUpdated }) + publishProviderDbCatalogChanged('provider-db-updated') } catch {} return this.createResult('updated', meta) } catch (error) { diff --git a/src/main/presenter/configPresenter/providerHelper.ts b/src/main/presenter/configPresenter/providerHelper.ts index a3c62f000..af0d5bb32 100644 --- a/src/main/presenter/configPresenter/providerHelper.ts +++ b/src/main/presenter/configPresenter/providerHelper.ts @@ -1,6 +1,4 @@ import logger from '@shared/logger' -import { eventBus, SendTarget } from '@/eventbus' -import { CONFIG_EVENTS } from '@/events' import { checkRequiresRebuild, ProviderBatchUpdate, @@ -8,6 +6,11 @@ import { } from '@shared/provider-operations' import { LLM_PROVIDER } from '@shared/presenter' import type { StoreLike } from './storeLike' +import { + emitProviderAtomicUpdate, + emitProviderBatchUpdate, + emitProvidersChanged +} from './eventPublishers' type SetSetting = (key: string, value: T) => void @@ -112,7 +115,7 @@ export class ProviderHelper { `[Config] Repaired providers store: ${providers.length} entries -> ${repairedProviders.length} valid providers` ) this.setSetting(PROVIDERS_STORE_KEY, repairedProviders) - eventBus.send(CONFIG_EVENTS.PROVIDER_CHANGED, SendTarget.ALL_WINDOWS) + emitProvidersChanged() } return repairedProviders } @@ -145,7 +148,7 @@ export class ProviderHelper { } this.setSetting(PROVIDERS_STORE_KEY, validProviders) - eventBus.send(CONFIG_EVENTS.PROVIDER_CHANGED, SendTarget.ALL_WINDOWS) + emitProvidersChanged() } getProviderById(id: string): LLM_PROVIDER | undefined { @@ -182,14 +185,14 @@ export class ProviderHelper { requiresRebuild, updates } - eventBus.send(CONFIG_EVENTS.PROVIDER_ATOMIC_UPDATE, SendTarget.ALL_WINDOWS, change) + emitProviderAtomicUpdate(change) return requiresRebuild } updateProvidersBatch(batchUpdate: ProviderBatchUpdate): void { this.setSetting(PROVIDERS_STORE_KEY, batchUpdate.providers) - eventBus.send(CONFIG_EVENTS.PROVIDER_BATCH_UPDATE, SendTarget.ALL_WINDOWS, batchUpdate) + 
emitProviderBatchUpdate(batchUpdate) } addProviderAtomic(provider: LLM_PROVIDER): void { @@ -203,7 +206,7 @@ export class ProviderHelper { requiresRebuild: true, provider } - eventBus.send(CONFIG_EVENTS.PROVIDER_ATOMIC_UPDATE, SendTarget.ALL_WINDOWS, change) + emitProviderAtomicUpdate(change) } removeProviderAtomic(providerId: string): void { @@ -228,7 +231,7 @@ export class ProviderHelper { providerId, requiresRebuild: true } - eventBus.send(CONFIG_EVENTS.PROVIDER_ATOMIC_UPDATE, SendTarget.ALL_WINDOWS, change) + emitProviderAtomicUpdate(change) } reorderProvidersAtomic(providers: LLM_PROVIDER[]): void { @@ -239,7 +242,7 @@ export class ProviderHelper { providerId: '', requiresRebuild: false } - eventBus.send(CONFIG_EVENTS.PROVIDER_ATOMIC_UPDATE, SendTarget.ALL_WINDOWS, change) + emitProviderAtomicUpdate(change) } getDefaultProviders(): LLM_PROVIDER[] { diff --git a/src/main/presenter/configPresenter/providerModelHelper.ts b/src/main/presenter/configPresenter/providerModelHelper.ts index 4966f6274..daa028866 100644 --- a/src/main/presenter/configPresenter/providerModelHelper.ts +++ b/src/main/presenter/configPresenter/providerModelHelper.ts @@ -1,12 +1,11 @@ import logger from '@shared/logger' -import { eventBus, SendTarget } from '@/eventbus' -import { CONFIG_EVENTS } from '@/events' import { ModelConfig, MODEL_META } from '@shared/presenter' import { ModelType } from '@shared/model' import { resolveVideoGenerationCompatType } from '@shared/videoGenerationSettings' import ElectronStore from 'electron-store' import path from 'path' import type { StoreLike } from './storeLike' +import { emitModelsChanged } from './eventPublishers' export interface IModelStore { models: MODEL_META[] @@ -302,7 +301,7 @@ export class ProviderModelHelper { this.setCustomModels(providerId, models) this.setModelStatus(providerId, model.id, true) - eventBus.send(CONFIG_EVENTS.MODEL_LIST_CHANGED, SendTarget.ALL_WINDOWS, providerId) + emitModelsChanged(providerId) } 
removeCustomModel(providerId: string, modelId: string): void { @@ -310,7 +309,7 @@ export class ProviderModelHelper { const filteredModels = models.filter((model) => model.id !== modelId) this.setCustomModels(providerId, filteredModels) this.deleteModelStatus(providerId, modelId) - eventBus.send(CONFIG_EVENTS.MODEL_LIST_CHANGED, SendTarget.ALL_WINDOWS, providerId) + emitModelsChanged(providerId) } updateCustomModel(providerId: string, modelId: string, updates: Partial): void { @@ -319,7 +318,7 @@ export class ProviderModelHelper { if (index !== -1) { models[index] = { ...models[index], ...updates } this.setCustomModels(providerId, models) - eventBus.send(CONFIG_EVENTS.MODEL_LIST_CHANGED, SendTarget.ALL_WINDOWS, providerId) + emitModelsChanged(providerId) } } } diff --git a/src/main/presenter/configPresenter/systemPromptHelper.ts b/src/main/presenter/configPresenter/systemPromptHelper.ts index b6ffdba12..1ed4f348d 100644 --- a/src/main/presenter/configPresenter/systemPromptHelper.ts +++ b/src/main/presenter/configPresenter/systemPromptHelper.ts @@ -1,8 +1,7 @@ -import { eventBus, SendTarget } from '@/eventbus' -import { CONFIG_EVENTS } from '@/events' import { SystemPrompt } from '@shared/presenter' import ElectronStore from 'electron-store' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' +import { emitDefaultSystemPromptChanged } from './eventPublishers' type SetSetting = (key: string, value: T) => void @@ -149,7 +148,7 @@ export class SystemPromptHelper { if (promptId === 'empty') { await this.setSystemPrompts(updatedPrompts) await this.clearSystemPrompt() - eventBus.send(CONFIG_EVENTS.DEFAULT_SYSTEM_PROMPT_CHANGED, SendTarget.ALL_WINDOWS, { + emitDefaultSystemPromptChanged({ promptId: 'empty', content: '' }) @@ -162,7 +161,7 @@ export class SystemPromptHelper { updatedPrompts[targetIndex].isDefault = true await this.setSystemPrompts(updatedPrompts) await this.setDefaultSystemPrompt(updatedPrompts[targetIndex].content) - 
eventBus.send(CONFIG_EVENTS.DEFAULT_SYSTEM_PROMPT_CHANGED, SendTarget.ALL_WINDOWS, { + emitDefaultSystemPromptChanged({ promptId, content: updatedPrompts[targetIndex].content }) diff --git a/src/main/presenter/configPresenter/uiSettingsHelper.ts b/src/main/presenter/configPresenter/uiSettingsHelper.ts index 1b15c88c2..2302cebc9 100644 --- a/src/main/presenter/configPresenter/uiSettingsHelper.ts +++ b/src/main/presenter/configPresenter/uiSettingsHelper.ts @@ -1,4 +1,4 @@ -import { eventBus, SendTarget } from '@/eventbus' +import { eventBus } from '@/eventbus' import { CONFIG_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import type { SettingsKey, SettingsSnapshotValues } from '@shared/contracts/routes' @@ -65,7 +65,7 @@ export class UiSettingsHelper { setSearchPreviewEnabled(enabled: boolean): void { const boolValue = Boolean(enabled) this.setSetting('searchPreviewEnabled', boolValue) - eventBus.send(CONFIG_EVENTS.SEARCH_PREVIEW_CHANGED, SendTarget.ALL_WINDOWS, boolValue) + eventBus.sendToMain(CONFIG_EVENTS.SEARCH_PREVIEW_CHANGED, boolValue) } getAutoScrollEnabled(): boolean { @@ -77,7 +77,7 @@ export class UiSettingsHelper { setAutoScrollEnabled(enabled: boolean): void { const boolValue = Boolean(enabled) this.setSetting('autoScrollEnabled', boolValue) - eventBus.send(CONFIG_EVENTS.AUTO_SCROLL_CHANGED, SendTarget.ALL_WINDOWS, boolValue) + eventBus.sendToMain(CONFIG_EVENTS.AUTO_SCROLL_CHANGED, boolValue) } getAutoCompactionEnabled(): boolean { @@ -123,7 +123,7 @@ export class UiSettingsHelper { setContentProtectionEnabled(enabled: boolean): void { this.setSetting('contentProtectionEnabled', enabled) - eventBus.send(CONFIG_EVENTS.CONTENT_PROTECTION_CHANGED, SendTarget.ALL_WINDOWS, enabled) + eventBus.sendToMain(CONFIG_EVENTS.CONTENT_PROTECTION_CHANGED, enabled) } getPrivacyModeEnabled(): boolean { @@ -142,12 +142,12 @@ export class UiSettingsHelper { setCopyWithCotEnabled(enabled: boolean): void { 
this.setSetting('copyWithCotEnabled', enabled) - eventBus.send(CONFIG_EVENTS.COPY_WITH_COT_CHANGED, SendTarget.ALL_WINDOWS, enabled) + eventBus.sendToMain(CONFIG_EVENTS.COPY_WITH_COT_CHANGED, enabled) } setTraceDebugEnabled(enabled: boolean): void { this.setSetting('traceDebugEnabled', enabled) - eventBus.send(CONFIG_EVENTS.TRACE_DEBUG_CHANGED, SendTarget.ALL_WINDOWS, enabled) + eventBus.sendToMain(CONFIG_EVENTS.TRACE_DEBUG_CHANGED, enabled) } getNotificationsEnabled(): boolean { @@ -161,7 +161,7 @@ export class UiSettingsHelper { setNotificationsEnabled(enabled: boolean): void { const boolValue = Boolean(enabled) this.setSetting('notificationsEnabled', boolValue) - eventBus.send(CONFIG_EVENTS.NOTIFICATIONS_CHANGED, SendTarget.ALL_WINDOWS, boolValue) + eventBus.sendToMain(CONFIG_EVENTS.NOTIFICATIONS_CHANGED, boolValue) } getFontFamily(): string { @@ -171,7 +171,7 @@ export class UiSettingsHelper { setFontFamily(fontFamily?: string | null): void { const normalized = this.normalizeStoredFont(fontFamily) this.setSetting('fontFamily', normalized) - eventBus.send(CONFIG_EVENTS.FONT_FAMILY_CHANGED, SendTarget.ALL_WINDOWS, normalized) + eventBus.sendToMain(CONFIG_EVENTS.FONT_FAMILY_CHANGED, normalized) } getCodeFontFamily(): string { @@ -181,7 +181,7 @@ export class UiSettingsHelper { setCodeFontFamily(fontFamily?: string | null): void { const normalized = this.normalizeStoredFont(fontFamily) this.setSetting('codeFontFamily', normalized) - eventBus.send(CONFIG_EVENTS.CODE_FONT_FAMILY_CHANGED, SendTarget.ALL_WINDOWS, normalized) + eventBus.sendToMain(CONFIG_EVENTS.CODE_FONT_FAMILY_CHANGED, normalized) } resetFontSettings(): void { diff --git a/src/main/presenter/deeplinkPresenter/index.ts b/src/main/presenter/deeplinkPresenter/index.ts index f6b4dc9a5..a0a05d674 100644 --- a/src/main/presenter/deeplinkPresenter/index.ts +++ b/src/main/presenter/deeplinkPresenter/index.ts @@ -3,14 +3,10 @@ import { app, BrowserWindow } from 'electron' import { presenter } from '@/presenter' 
import { IDeeplinkPresenter, MCPServerConfig } from '@shared/presenter' import path from 'path' -import { - NOTIFICATION_EVENTS, - SETTINGS_EVENTS, - DEEPLINK_EVENTS, - MCP_EVENTS, - WINDOW_EVENTS -} from '@/events' -import { eventBus, SendTarget } from '@/eventbus' +import { DEEPLINK_EVENTS, MCP_EVENTS, WINDOW_EVENTS } from '@/events' +import { eventBus } from '@/eventbus' +import { DEEPCHAT_EVENT_CHANNEL } from '@shared/contracts/channels' +import { createDeepchatEventEnvelope, publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import { consumeStartupDeepLink } from '@/lib/startupDeepLink' import { PROVIDER_INSTALL_VERSION, @@ -419,10 +415,14 @@ export class DeeplinkPresenter implements IDeeplinkPresenter { } presenter.windowPresenter.setPendingSettingsProviderInstall(preview) - presenter.windowPresenter.sendToWindow(settingsWindowId, SETTINGS_EVENTS.NAVIGATE, { + presenter.windowPresenter.sendSettingsNavigation(settingsWindowId, { routeName: 'settings-provider' }) - presenter.windowPresenter.sendToWindow(settingsWindowId, SETTINGS_EVENTS.PROVIDER_INSTALL) + presenter.windowPresenter.sendToWindow( + settingsWindowId, + DEEPCHAT_EVENT_CHANNEL, + createDeepchatEventEnvelope('settings.providerInstallRequested', {}) + ) } catch (error) { const message = error instanceof Error ? error.message : 'Invalid provider deeplink.' 
console.error('Error parsing provider install deeplink:', error) @@ -573,7 +573,7 @@ export class DeeplinkPresenter implements IDeeplinkPresenter { } private notifyProviderImportError(message: string): void { - eventBus.sendToRenderer(NOTIFICATION_EVENTS.SHOW_ERROR, SendTarget.ALL_WINDOWS, { + publishDeepchatEvent('notification.error', { id: `provider-deeplink-${Date.now()}`, title: 'Provider Deeplink', message, diff --git a/src/main/presenter/devicePresenter/index.ts b/src/main/presenter/devicePresenter/index.ts index 0c3540ed2..0fbfc58f2 100644 --- a/src/main/presenter/devicePresenter/index.ts +++ b/src/main/presenter/devicePresenter/index.ts @@ -9,12 +9,14 @@ import { app, dialog } from 'electron' import { nanoid } from 'nanoid' import axios from 'axios' import { is } from '@electron-toolkit/utils' -import { eventBus, SendTarget } from '../../eventbus' -import { NOTIFICATION_EVENTS } from '../../events' import { svgSanitizer } from '../../lib/svgSanitizer' -import { presenter } from '../index' +import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' const execAsync = promisify(exec) +async function getPresenterRuntime() { + return (await import('../index')).presenter +} + function toMimeType(value: unknown): string { if (typeof value === 'string') { return value @@ -348,13 +350,15 @@ export class DevicePresenter implements IDevicePresenter { } } + const runtimePresenter = await getPresenterRuntime() + switch (resetType) { case 'chat': { // 删除聊天数据 logger.info('Resetting chat data...') try { - if (presenter.sqlitePresenter) { - presenter.sqlitePresenter.close() + if (runtimePresenter.sqlitePresenter) { + runtimePresenter.sqlitePresenter.close() logger.info('SQLite database connection closed') } await new Promise((resolve) => setTimeout(resolve, 500)) @@ -388,8 +392,8 @@ export class DevicePresenter implements IDevicePresenter { // 删除知识库数据 logger.info('Resetting knowledge base data...') try { - if (presenter.knowledgePresenter) { - await 
presenter.knowledgePresenter.destroy() + if (runtimePresenter.knowledgePresenter) { + await runtimePresenter.knowledgePresenter.destroy() logger.info('Knowledge database connections closed') } await new Promise((resolve) => setTimeout(resolve, 500)) @@ -434,12 +438,12 @@ export class DevicePresenter implements IDevicePresenter { // 删除整个用户数据目录 logger.info('Performing complete reset of user data...') try { - if (presenter.sqlitePresenter) { - presenter.sqlitePresenter.close() + if (runtimePresenter.sqlitePresenter) { + runtimePresenter.sqlitePresenter.close() logger.info('SQLite database connection closed') } - if (presenter.knowledgePresenter) { - await presenter.knowledgePresenter.destroy() + if (runtimePresenter.knowledgePresenter) { + await runtimePresenter.knowledgePresenter.destroy() logger.info('Knowledge database connections closed') } await new Promise((resolve) => setTimeout(resolve, 1000)) @@ -466,7 +470,7 @@ export class DevicePresenter implements IDevicePresenter { try { if (is.dev) { logger.info('开发环境下数据重置完成,发送通知到渲染进程') - eventBus.sendToRenderer(NOTIFICATION_EVENTS.DATA_RESET_COMPLETE_DEV, SendTarget.ALL_WINDOWS) + publishDeepchatEvent('appRuntime.dataResetCompleteDev', {}) return } diff --git a/src/main/presenter/dialogPresenter/index.ts b/src/main/presenter/dialogPresenter/index.ts index 38de4deaf..7fffc603b 100644 --- a/src/main/presenter/dialogPresenter/index.ts +++ b/src/main/presenter/dialogPresenter/index.ts @@ -11,8 +11,6 @@ import { DialogResponse, IDialogPresenter } from '@shared/presenter' -import { eventBus, SendTarget } from '@/eventbus' -import { DIALOG_EVENTS } from '@/events' import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' import { nanoid } from 'nanoid' @@ -50,8 +48,6 @@ export class DialogPresenter implements IDialogPresenter { } this.pendingDialogs.set(finalRequest.id, { resolve, reject }) try { - // send dialog request to renderer - eventBus.sendToRenderer(DIALOG_EVENTS.REQUEST, SendTarget.DEFAULT_WINDOW, 
finalRequest) publishDeepchatEvent('dialog.requested', { ...finalRequest, version: Date.now() diff --git a/src/main/presenter/floatingButtonPresenter/FloatingButtonWindow.ts b/src/main/presenter/floatingButtonPresenter/FloatingButtonWindow.ts index 83e3beeb8..a08cc07b6 100644 --- a/src/main/presenter/floatingButtonPresenter/FloatingButtonWindow.ts +++ b/src/main/presenter/floatingButtonPresenter/FloatingButtonWindow.ts @@ -40,7 +40,7 @@ export class FloatingButtonWindow { } try { - const isDev = is.dev + const rendererUrl = process.env['ELECTRON_RENDERER_URL'] const initialBounds = this.resolveInitialBounds() this.dockSide = inferDockSide( initialBounds, @@ -71,7 +71,7 @@ export class FloatingButtonWindow { contextIsolation: true, preload: path.join(__dirname, '../preload/floating.mjs'), webSecurity: false, - devTools: isDev, + devTools: is.dev, sandbox: false } }) @@ -81,8 +81,8 @@ export class FloatingButtonWindow { this.window.setOpacity(1) this.setBounds(initialBounds) - if (isDev) { - await this.window.loadURL('http://localhost:5173/floating/') + if (is.dev && rendererUrl) { + await this.window.loadURL(`${rendererUrl}/floating/`) } else { await this.window.loadFile(path.join(__dirname, '../renderer/floating/index.html')) } diff --git a/src/main/presenter/floatingButtonPresenter/index.ts b/src/main/presenter/floatingButtonPresenter/index.ts index c55250c0b..28146bf1d 100644 --- a/src/main/presenter/floatingButtonPresenter/index.ts +++ b/src/main/presenter/floatingButtonPresenter/index.ts @@ -39,6 +39,23 @@ type DragRuntimeState = { windowHeight: number } +type PointPayload = { + x: number + y: number +} + +const isPointPayload = (payload: unknown): payload is PointPayload => { + if (!payload || typeof payload !== 'object') { + return false + } + + const { x, y } = payload as { x?: unknown; y?: unknown } + return typeof x === 'number' && Number.isFinite(x) && typeof y === 'number' && Number.isFinite(y) +} + +const isNonEmptyString = (payload: unknown): payload 
is string => + typeof payload === 'string' && payload.trim().length > 0 + export class FloatingButtonPresenter { private floatingWindow: FloatingButtonWindow | null = null private config: FloatingButtonConfig @@ -281,11 +298,19 @@ export class FloatingButtonPresenter { this.setExpanded(Boolean(expanded)) }) - ipcMain.on(FLOATING_BUTTON_EVENTS.OPEN_SESSION, (_event, sessionId: string) => { - void this.openSession(sessionId) + ipcMain.on(FLOATING_BUTTON_EVENTS.OPEN_SESSION, (_event, sessionId: unknown) => { + if (!isNonEmptyString(sessionId)) { + return + } + + void this.openSession(sessionId.trim()) }) - ipcMain.on(FLOATING_BUTTON_EVENTS.DRAG_START, (_event, { x, y }: { x: number; y: number }) => { + ipcMain.on(FLOATING_BUTTON_EVENTS.DRAG_START, (_event, payload: unknown) => { + if (!isPointPayload(payload)) { + return + } + if (!this.floatingWindow?.exists()) { return } @@ -303,8 +328,8 @@ export class FloatingButtonPresenter { this.floatingWindow.setOpacity(this.resolveWindowOpacity()) dragState = { - startX: x, - startY: y, + startX: payload.x, + startY: payload.y, windowX: stableBounds.x, windowY: stableBounds.y, windowWidth: stableBounds.width, @@ -312,13 +337,17 @@ export class FloatingButtonPresenter { } }) - ipcMain.on(FLOATING_BUTTON_EVENTS.DRAG_MOVE, (_event, { x, y }: { x: number; y: number }) => { + ipcMain.on(FLOATING_BUTTON_EVENTS.DRAG_MOVE, (_event, payload: unknown) => { + if (!isPointPayload(payload)) { + return + } + if (!dragState || !this.floatingWindow?.exists()) { return } - const deltaX = x - dragState.startX - const deltaY = y - dragState.startY + const deltaX = payload.x - dragState.startX + const deltaY = payload.y - dragState.startY this.floatingWindow.setBounds({ x: dragState.windowX + deltaX, diff --git a/src/main/presenter/index.ts b/src/main/presenter/index.ts index fdbc631b5..16a1e6fee 100644 --- a/src/main/presenter/index.ts +++ b/src/main/presenter/index.ts @@ -1,7 +1,7 @@ import logger from '@shared/logger' import path from 'path' 
import { DialogPresenter } from './dialogPresenter/index' -import { BrowserWindow, ipcMain, IpcMainInvokeEvent, app } from 'electron' +import { ipcMain, app } from 'electron' import { WindowPresenter } from './windowPresenter' import { ShortcutPresenter } from './shortcutPresenter' import { @@ -83,21 +83,10 @@ import type { SessionPermissionPort, SessionUiPort } from './runtimePorts' -import { handlePresenterCallError, handlePresenterCallResult } from './presenterCallErrorHandler' import { createMainKernelRouteRuntime, registerMainKernelRoutes } from '@/routes' -import { setupLegacyTypedEventBridge } from '@/routes/legacyTypedEventBridge' import { StartupWorkloadCoordinator } from './startupWorkloadCoordinator' import type { StartupWorkloadTaskContext } from './startupWorkloadCoordinator' -// IPC调用上下文接口 -interface IPCCallContext { - windowId?: number - webContentsId: number - presenterName: string - methodName: string - timestamp: number -} - // 注意: 现在大部分事件已在各自的 presenter 中直接发送到渲染进程 // 剩余的自动转发事件已在 EventBus 的 DEFAULT_RENDERER_EVENTS 中定义 @@ -105,62 +94,6 @@ interface IPCCallContext { export class Presenter implements IPresenter { // 私有静态实例 private static instance: Presenter - static readonly DISPATCHABLE_PRESENTERS = new Set([ - 'windowPresenter', - 'sqlitePresenter', - 'llmproviderPresenter', - 'configPresenter', - 'exporter', - 'devicePresenter', - 'upgradePresenter', - 'shortcutPresenter', - 'filePresenter', - 'mcpPresenter', - 'syncPresenter', - 'deeplinkPresenter', - 'notificationPresenter', - 'tabPresenter', - 'yoBrowserPresenter', - 'oauthPresenter', - 'dialogPresenter', - 'knowledgePresenter', - 'workspacePresenter', - 'toolPresenter', - 'skillPresenter', - 'skillSyncPresenter', - 'agentSessionPresenter', - 'projectPresenter' - ]) - - static readonly REMOTE_CONTROL_METHODS = new Set([ - 'listRemoteChannels', - 'getChannelSettings', - 'saveChannelSettings', - 'getChannelStatus', - 'getChannelBindings', - 'removeChannelBinding', - 'removeChannelPrincipal', - 
'getChannelPairingSnapshot', - 'createChannelPairCode', - 'clearChannelPairCode', - 'clearChannelBindings', - 'getTelegramSettings', - 'saveTelegramSettings', - 'getTelegramStatus', - 'getTelegramBindings', - 'removeTelegramBinding', - 'getTelegramPairingSnapshot', - 'createTelegramPairCode', - 'clearTelegramPairCode', - 'clearTelegramBindings', - 'getWeixinIlinkSettings', - 'saveWeixinIlinkSettings', - 'getWeixinIlinkStatus', - 'startWeixinIlinkLogin', - 'waitForWeixinIlinkLogin', - 'removeWeixinIlinkAccount', - 'restartWeixinIlinkAccount' - ]) windowPresenter: IWindowPresenter sqlitePresenter: ISQLitePresenter @@ -190,6 +123,7 @@ export class Presenter implements IPresenter { skillSyncPresenter: ISkillSyncPresenter agentSessionPresenter: IAgentSessionPresenter projectPresenter: IProjectPresenter + remoteControlPresenter: IRemoteControlPresenter pluginPresenter: PluginPresenter databaseSecurityPresenter: DatabaseSecurityPresenter hooksNotifications: HooksNotificationsService @@ -202,7 +136,6 @@ export class Presenter implements IPresenter { private sessionPresenterInternal?: SessionPresenter private hasInitialized = false #remoteControlPresenter: RemoteControlPresenterLike - readonly #remoteControlBridge: IRemoteControlPresenter private constructor(lifecycleManager: ILifecycleManager) { // Store lifecycle manager reference for component access @@ -428,6 +361,8 @@ export class Presenter implements IPresenter { createSettingsWindow: () => this.windowPresenter.createSettingsWindow(), sendToWindow: (windowId, channel, ...args) => this.windowPresenter.sendToWindow(windowId, channel, ...args), + sendSettingsNavigation: (windowId, navigation) => + this.windowPresenter.sendSettingsNavigation(windowId, navigation), getApprovedFilePaths: (conversationId, requiredPermission) => this.filePermissionService.getApprovedPaths(conversationId, requiredPermission), consumeSettingsApproval: (conversationId, toolName) => @@ -609,7 +544,7 @@ export class Presenter implements IPresenter 
{ windowPresenter: this.windowPresenter, tabPresenter: this.tabPresenter }) - this.#remoteControlBridge = this.#remoteControlPresenter + this.remoteControlPresenter = this.#remoteControlPresenter // Update hooksNotifications with actual dependencies now that agentSessionPresenter is ready this.hooksNotifications = new HooksNotificationsService(this.configPresenter, { @@ -906,18 +841,6 @@ export class Presenter implements IPresenter { ) } - async callRemoteControl( - method: keyof IRemoteControlPresenter, - ...payloads: unknown[] - ): Promise { - if (!Presenter.REMOTE_CONTROL_METHODS.has(method)) { - throw new Error(`Method "${String(method)}" is not allowed on "remoteControlPresenter"`) - } - - const handler = this.#remoteControlBridge[method] as (...args: unknown[]) => unknown - return await Reflect.apply(handler, this.#remoteControlBridge, payloads) - } - getStartupWorkloadCoordinator(): StartupWorkloadCoordinator { return this.startupWorkloadCoordinator } @@ -958,7 +881,12 @@ const buildMainKernelRouteRuntime = () => llmProviderPresenter: presenter.llmproviderPresenter, agentSessionPresenter: presenter.agentSessionPresenter, skillPresenter: presenter.skillPresenter, + skillSyncPresenter: presenter.skillSyncPresenter, + exporter: presenter.exporter, + oauthPresenter: presenter.oauthPresenter, mcpPresenter: presenter.mcpPresenter, + remoteControlPresenter: presenter.remoteControlPresenter, + shortcutPresenter: presenter.shortcutPresenter, syncPresenter: presenter.syncPresenter, upgradePresenter: presenter.upgradePresenter, dialogPresenter: presenter.dialogPresenter, @@ -968,6 +896,7 @@ const buildMainKernelRouteRuntime = () => devicePresenter: presenter.devicePresenter, projectPresenter: presenter.projectPresenter, filePresenter: presenter.filePresenter, + knowledgePresenter: presenter.knowledgePresenter, workspacePresenter: presenter.workspacePresenter, yoBrowserPresenter: presenter.yoBrowserPresenter, tabPresenter: presenter.tabPresenter, @@ -991,157 +920,7 @@ 
export function getMainKernelRouteRuntime(): ReturnType (presenter ? getMainKernelRouteRuntime() : undefined)) - -// 检查对象属性是否为函数 (用于动态调用) -// eslint-disable-next-line @typescript-eslint/no-explicit-any -function isFunction(obj: any, prop: string): obj is { [key: string]: (...args: any[]) => any } { - return typeof obj[prop] === 'function' -} - -// IPC 主进程处理程序:动态调用 Presenter 的方法 (支持 window/webContents 上下文) -ipcMain.handle( - 'presenter:call', - (event: IpcMainInvokeEvent, name: string, method: string, ...payloads: unknown[]) => { - const webContentsId = event.sender.id - try { - // 构建调用上下文 - const windowId = BrowserWindow.fromWebContents(event.sender)?.id - - const context: IPCCallContext = { - windowId, - webContentsId, - presenterName: name, - methodName: method, - timestamp: Date.now() - } - - // 记录调用日志 - if (import.meta.env.VITE_LOG_IPC_CALL === '1') { - logger.info( - `[IPC Call] WebContents:${context.webContentsId} Window:${context.windowId || 'unknown'} -> ${context.presenterName}.${context.methodName}` - ) - } - - if (!Presenter.DISPATCHABLE_PRESENTERS.has(name as keyof IPresenter)) { - console.warn( - `[IPC Warning] WebContents:${context.webContentsId} blocked presenter access: ${name}` - ) - return { error: `Presenter "${name}" is not accessible via generic dispatcher` } - } - - // 通过名称获取对应的 Presenter 实例 - // eslint-disable-next-line @typescript-eslint/no-explicit-any - let calledPresenter: any = presenter[name as keyof Presenter] - let resolvedMethod = method - let resolvedPayloads = payloads - - if (!calledPresenter) { - console.warn( - `[IPC Warning] WebContents:${context.webContentsId} calling wrong presenter: ${name}` - ) - return { error: `Presenter "${name}" not found` } - } - - // 检查方法是否存在且为函数 - if (isFunction(calledPresenter, resolvedMethod)) { - // 调用方法并返回结果 - const result = calledPresenter[resolvedMethod](...resolvedPayloads) - return handlePresenterCallResult(result, { - webContentsId, - presenterName: name, - methodName: method - }) - } else { 
- console.warn( - `[IPC Warning] WebContents:${context.webContentsId} called method is not a function or does not exist: ${name}.${method}` - ) - return { error: `Method "${method}" not found or not a function on "${name}"` } - } - } catch ( - // eslint-disable-next-line @typescript-eslint/no-explicit-any - e: any - ) { - return handlePresenterCallError(e, { - webContentsId, - presenterName: name, - methodName: method - }) - } - } -) - -ipcMain.handle( - 'remoteControlPresenter:call', - async (event: IpcMainInvokeEvent, method: string, ...payloads: unknown[]) => { - const webContentsId = event.sender.id - try { - const windowId = BrowserWindow.fromWebContents(event.sender)?.id - - if (import.meta.env.VITE_LOG_IPC_CALL === '1') { - logger.info( - `[IPC Call] WebContents:${webContentsId} Window:${windowId || 'unknown'} -> remoteControlPresenter.${method}` - ) - } - - if (!Presenter.REMOTE_CONTROL_METHODS.has(method as keyof IRemoteControlPresenter)) { - console.warn( - `[IPC Warning] WebContents:${webContentsId} blocked remote control method: ${method}` - ) - return { error: `Method "${method}" is not allowed on "remoteControlPresenter"` } - } - - const isSettingsWindow = - windowId != null && presenter.windowPresenter.getSettingsWindowId() === windowId - const shouldTrackRemoteRuntime = - isSettingsWindow && - (method === 'listRemoteChannels' || - method.startsWith('getChannel') || - method.startsWith('getTelegram') || - method.startsWith('getFeishu') || - method.startsWith('getQQBot') || - method.startsWith('getDiscord') || - method.startsWith('getWeixinIlink')) - - const result = shouldTrackRemoteRuntime - ? 
presenter.startupWorkloadCoordinator.scheduleTask({ - id: `settings.remote.runtime:${method}`, - target: 'settings', - phase: 'deferred', - resource: 'io', - labelKey: 'startup.settings.remote.runtime', - visibleId: 'settings.remote.runtime', - runId: presenter.startupWorkloadCoordinator.getRunId('settings'), - run: async () => { - return await presenter.callRemoteControl( - method as keyof IRemoteControlPresenter, - ...payloads - ) - } - }) - : presenter.callRemoteControl(method as keyof IRemoteControlPresenter, ...payloads) - - return handlePresenterCallResult(result, { - webContentsId, - presenterName: 'remoteControlPresenter', - methodName: method - }) - } catch ( - // eslint-disable-next-line @typescript-eslint/no-explicit-any - e: any - ) { - return handlePresenterCallError(e, { - webContentsId, - presenterName: 'remoteControlPresenter', - methodName: method - }) - } - } -) diff --git a/src/main/presenter/knowledgePresenter/knowledgeStorePresenter.ts b/src/main/presenter/knowledgePresenter/knowledgeStorePresenter.ts index e4ebdf410..f5ff6f76e 100644 --- a/src/main/presenter/knowledgePresenter/knowledgeStorePresenter.ts +++ b/src/main/presenter/knowledgePresenter/knowledgeStorePresenter.ts @@ -16,8 +16,27 @@ import { nanoid } from 'nanoid' import { RecursiveCharacterTextSplitter } from '@/lib/textsplitters' import { sanitizeText } from '@/utils/strings' import { getMetric, normalizeDistance } from '@/utils/vector' -import { eventBus, SendTarget } from '@/eventbus' -import { RAG_EVENTS } from '@/events' +import { publishDeepchatEvent } from '@/routes/publishDeepchatEvent' + +function publishKnowledgeFileUpdated(fileMessage: KnowledgeFileMessage): void { + publishDeepchatEvent('knowledge.file.updated', { + ...fileMessage, + version: Date.now() + }) +} + +function publishKnowledgeFileProgress( + fileId: string, + progress: { completed: number; error: number; total: number } +): void { + publishDeepchatEvent('knowledge.file.progress', { + fileId, + completed: 
progress.completed, + error: progress.error, + total: progress.total, + version: Date.now() + }) +} export class KnowledgeStorePresenter { private readonly vectorP: IVectorDatabasePresenter @@ -126,7 +145,7 @@ export class KnowledgeStorePresenter { fileMessage.metadata.errorReason = '无法读取文件或文件内容为空,请检查文件是否损坏或格式是否受支持' await this.enqueueFileTask(fileMessage.id, async () => this.vectorP.updateFile(fileMessage)) - eventBus.sendToRenderer(RAG_EVENTS.FILE_UPDATED, SendTarget.ALL_WINDOWS, fileMessage) + publishKnowledgeFileUpdated(fileMessage) return } @@ -143,7 +162,7 @@ export class KnowledgeStorePresenter { await this.enqueueFileTask(fileMessage.id, async () => this.vectorP.updateFile(fileMessage)) // 5. 发送文件更新事件 - eventBus.sendToRenderer(RAG_EVENTS.FILE_UPDATED, SendTarget.ALL_WINDOWS, fileMessage) + publishKnowledgeFileUpdated(fileMessage) // 6. 创建chunk记录 const chunkMessages = chunks.map((content, index) => ({ @@ -239,12 +258,7 @@ export class KnowledgeStorePresenter { progress.completed++ // 更新文件进度 - eventBus.sendToRenderer(RAG_EVENTS.FILE_PROGRESS, SendTarget.ALL_WINDOWS, { - fileId, - completed: progress.completed, - error: progress.error, - total: progress.total - }) + publishKnowledgeFileProgress(fileId, progress) // 检查是否所有分片都完成了 if (progress.completed + progress.error === progress.total) { @@ -271,12 +285,7 @@ export class KnowledgeStorePresenter { progress.error++ // 更新文件进度 - eventBus.sendToRenderer(RAG_EVENTS.FILE_PROGRESS, SendTarget.ALL_WINDOWS, { - fileId, - completed: progress.completed, - error: progress.error, - total: progress.total - }) + publishKnowledgeFileProgress(fileId, progress) // 检查是否所有分片都完成了 if (progress.completed + progress.error === progress.total) { @@ -294,7 +303,7 @@ export class KnowledgeStorePresenter { if (fileMessage) { fileMessage.status = 'completed' await this.enqueueFileTask(fileId, async () => this.vectorP.updateFile(fileMessage)) - eventBus.sendToRenderer(RAG_EVENTS.FILE_UPDATED, SendTarget.ALL_WINDOWS, fileMessage) + 
publishKnowledgeFileUpdated(fileMessage) logger.info(`[RAG] File processing completed for ${fileId}`) } } catch (error) { @@ -312,7 +321,7 @@ export class KnowledgeStorePresenter { fileMessage.metadata.errorReason = errorMessage } await this.enqueueFileTask(fileId, async () => this.vectorP.updateFile(fileMessage)) - eventBus.sendToRenderer(RAG_EVENTS.FILE_UPDATED, SendTarget.ALL_WINDOWS, fileMessage) + publishKnowledgeFileUpdated(fileMessage) } } catch (error) { console.error(`[RAG] Error handling file processing error for ${fileId}:`, error) diff --git a/src/main/presenter/lifecyclePresenter/SplashWindowManager.ts b/src/main/presenter/lifecyclePresenter/SplashWindowManager.ts index bc6ccb0b9..228732b8a 100644 --- a/src/main/presenter/lifecyclePresenter/SplashWindowManager.ts +++ b/src/main/presenter/lifecyclePresenter/SplashWindowManager.ts @@ -609,10 +609,6 @@ export class SplashWindowManager implements ISplashWindowManager { } private buildInlineFallbackSplashUrl(): string { - const progressChannel = JSON.stringify(DATABASE_UNLOCK_PROGRESS_CHANNEL) - const requestChannel = JSON.stringify(DATABASE_UNLOCK_REQUEST_CHANNEL) - const submitChannel = JSON.stringify(DATABASE_UNLOCK_SUBMIT_CHANNEL) - const cancelChannel = JSON.stringify(DATABASE_UNLOCK_CANCEL_CHANNEL) const html = ` @@ -654,7 +650,7 @@ export class SplashWindowManager implements ISplashWindowManager { diff --git a/src/renderer/floating/env.d.ts b/src/renderer/floating/env.d.ts index 0dea3f91c..cf3184a9c 100644 --- a/src/renderer/floating/env.d.ts +++ b/src/renderer/floating/env.d.ts @@ -2,6 +2,8 @@ import type { FloatingWidgetSnapshot } from '@shared/types/floating-widget' +type FloatingButtonUnsubscribe = () => void + declare module '*.vue' { import type { DefineComponent } from 'vue' // eslint-disable-next-line @typescript-eslint/no-explicit-any, @typescript-eslint/no-empty-object-type @@ -25,11 +27,14 @@ declare global { onDragStart: (x: number, y: number) => void onDragMove: (x: number, y: number) => 
void onDragEnd: (x: number, y: number) => void - onSnapshotUpdate: (callback: (snapshot: FloatingWidgetSnapshot) => void) => void - onLanguageChanged: (callback: (language: string) => void) => void - onThemeChanged: (callback: (theme: 'dark' | 'light') => void) => void - onConfigUpdate: (callback: (config: Record) => void) => void - removeAllListeners: () => void + onSnapshotUpdate: ( + callback: (snapshot: FloatingWidgetSnapshot) => void + ) => FloatingButtonUnsubscribe + onLanguageChanged: (callback: (language: string) => void) => FloatingButtonUnsubscribe + onThemeChanged: (callback: (theme: 'dark' | 'light') => void) => FloatingButtonUnsubscribe + onConfigUpdate: ( + callback: (config: Record) => void + ) => FloatingButtonUnsubscribe } } } diff --git a/src/renderer/floating/main.ts b/src/renderer/floating/main.ts index 36336b2c2..c512743ed 100644 --- a/src/renderer/floating/main.ts +++ b/src/renderer/floating/main.ts @@ -57,7 +57,7 @@ void window.floatingButtonAPI console.warn('Failed to initialize floating widget language:', error) }) -window.floatingButtonAPI.onLanguageChanged(applyLanguage) +const unsubscribeLanguageChanged = window.floatingButtonAPI.onLanguageChanged(applyLanguage) void window.floatingButtonAPI .getTheme() @@ -66,4 +66,13 @@ void window.floatingButtonAPI console.warn('Failed to initialize floating widget theme:', error) }) -window.floatingButtonAPI.onThemeChanged(applyTheme) +const unsubscribeThemeChanged = window.floatingButtonAPI.onThemeChanged(applyTheme) + +window.addEventListener( + 'beforeunload', + () => { + unsubscribeLanguageChanged() + unsubscribeThemeChanged() + }, + { once: true } +) diff --git a/src/renderer/settings/App.vue b/src/renderer/settings/App.vue index 7aeb4b2b7..d58724183 100644 --- a/src/renderer/settings/App.vue +++ b/src/renderer/settings/App.vue @@ -82,7 +82,10 @@ import { useRouter, useRoute, RouterView } from 'vue-router' import { onMounted, onBeforeUnmount, Ref, ref, watch, computed, nextTick, unref } from 
'vue' import { useI18n } from 'vue-i18n' import { useTitle } from '@vueuse/core' -import { useLegacyPresenter } from '@api/legacy/presenters' +import { createConfigClient } from '@api/ConfigClient' +import { createDeviceClient } from '@api/DeviceClient' +import { createWindowClient } from '@api/WindowClient' +import { getRuntimePlatform } from '@api/runtime' import CloseIcon from './icons/CloseIcon.vue' import { useUiSettingsStore } from '../src/stores/uiSettingsStore' import { useLanguageStore } from '../src/stores/language' @@ -92,7 +95,6 @@ import ModelCheckDialog from '@/components/settings/ModelCheckDialog.vue' import { useDeviceVersion } from '../src/composables/useDeviceVersion' import { Toaster } from '@shadcn/components/ui/sonner' import 'vue-sonner/style.css' -import { NOTIFICATION_EVENTS, SETTINGS_EVENTS } from '@/events' import { useToast } from '@/components/use-toast' import { useThemeStore } from '@/stores/theme' import { useProviderStore } from '@/stores/providerStore' @@ -103,11 +105,8 @@ import { useMcpInstallDeeplinkHandler } from '../src/lib/storeInitializer' import { ensureIconsLoaded } from '../src/lib/iconLoader' import { useFontManager } from '../src/composables/useFontManager' import { markStartupInteractive } from '../src/lib/startupDeferred' -import type { - DatabaseRepairSuggestedPayload, - LLM_PROVIDER, - ProviderInstallPreview -} from '@shared/presenter' +import type { DatabaseRepairSuggestedPayload, LLM_PROVIDER } from '@shared/presenter' +import type { ProviderInstallPreview } from '@shared/providerDeeplink' import ProviderDeeplinkImportDialog from './components/ProviderDeeplinkImportDialog.vue' import { nanoid } from 'nanoid' import { @@ -126,9 +125,10 @@ type SettingsWindowState = Window & { __deepchatSettingsPendingSection?: string | null } -const devicePresenter = useLegacyPresenter('devicePresenter') -const windowPresenter = useLegacyPresenter('windowPresenter') -const configPresenter = useLegacyPresenter('configPresenter') 
+const configClient = createConfigClient() +const deviceClient = createDeviceClient() +const windowClient = createWindowClient() +const settingsEventCleanups: Array<() => void> = [] // Initialize stores const uiSettingsStore = useUiSettingsStore() @@ -262,7 +262,7 @@ const showDatabaseRepairSuggestedToast = (payload: DatabaseRepairSuggestedPayloa }) } -const handleSettingsNavigate = async (_event: unknown, payload?: SettingsNavigationPayload) => { +const handleSettingsNavigate = async (payload?: SettingsNavigationPayload) => { const routeName = payload?.routeName const params = normalizeRouteParams(payload?.params) if (!routeName || !router.hasRoute(routeName)) return @@ -359,7 +359,7 @@ const syncPendingProviderInstall = async () => { let preview: ProviderInstallPreview | null = null try { - preview = await windowPresenter.consumePendingSettingsProviderInstall() + preview = await windowClient.consumePendingSettingsProviderInstall() if (!preview) { return } @@ -368,7 +368,7 @@ const syncPendingProviderInstall = async () => { } catch (error) { if (preview) { try { - windowPresenter.setPendingSettingsProviderInstall(preview) + windowClient.requeuePendingSettingsProviderInstall(preview) } catch (requeueError) { console.error('Failed to requeue pending provider install preview:', requeueError) } @@ -444,13 +444,13 @@ const confirmProviderImport = async () => { } } -if (window?.electron?.ipcRenderer) { - window.electron.ipcRenderer.on(SETTINGS_EVENTS.NAVIGATE, handleSettingsNavigate) - window.electron.ipcRenderer.on(SETTINGS_EVENTS.PROVIDER_INSTALL, handleProviderInstall) -} +const cleanupSettingsNavigate = windowClient.onSettingsNavigate(handleSettingsNavigate) +const cleanupSettingsProviderInstall = windowClient.onSettingsProviderInstall(() => { + void handleProviderInstall() +}) const notifySettingsReady = () => { - window.electron?.ipcRenderer?.send(SETTINGS_EVENTS.READY) + void windowClient.notifySettingsReady() } const settings: Ref< { @@ -460,7 +460,7 @@ const 
settings: Ref< path: string }[] > = ref( - getSettingsRouteItems(window.electron?.process?.platform).map((item) => ({ + getSettingsRouteItems(getRuntimePlatform()).map((item) => ({ title: item.titleKey, name: item.routeName, icon: item.icon, @@ -469,7 +469,7 @@ const settings: Ref< ) const settingGroups = ref( - getSettingsNavigationGroups(window.electron?.process?.platform).map((group) => ({ + getSettingsNavigationGroups(getRuntimePlatform()).map((group) => ({ key: group.key, titleKey: group.titleKey, items: group.items.map((item) => ({ @@ -535,7 +535,7 @@ const getSettingsTabTestId = (name: string) => watch( () => languageStore.language, async () => { - locale.value = await configPresenter.getLanguage() + locale.value = await configClient.getLanguage() document.documentElement.dir = languageStore.dir } ) @@ -611,19 +611,17 @@ onMounted(async () => { startupWorkloadStore?.connect() // Listen for window maximize/unmaximize events - devicePresenter.getDeviceInfo().then((deviceInfo: any) => { + deviceClient.getDeviceInfo().then((deviceInfo) => { isMacOS.value = deviceInfo.platform === 'darwin' }) - window.electron.ipcRenderer.on(NOTIFICATION_EVENTS.SHOW_ERROR, (_event, error) => { + const cleanupNotificationError = windowClient.onNotificationError((error) => { showErrorToast(error) }) - window.electron.ipcRenderer.on( - NOTIFICATION_EVENTS.DATABASE_REPAIR_SUGGESTED, - (_event, payload) => { - showDatabaseRepairSuggestedToast(payload as DatabaseRepairSuggestedPayload) - } - ) + const cleanupDatabaseRepairSuggested = windowClient.onDatabaseRepairSuggested((payload) => { + showDatabaseRepairSuggestedToast(payload as DatabaseRepairSuggestedPayload) + }) + settingsEventCleanups.push(cleanupNotificationError, cleanupDatabaseRepairSuggested) const [settingsLoadResult, routerReadyResult] = await Promise.allSettled([ uiSettingsStore.loadSettings(), @@ -665,8 +663,8 @@ onMounted(async () => { logSettingsStartup('settings window ready IPC sent') }) -const closeWindow = () => { 
- windowPresenter.closeSettingsWindow() +const closeWindow = async () => { + await windowClient.closeSettings() } onBeforeUnmount(() => { @@ -675,13 +673,9 @@ onBeforeUnmount(() => { errorDisplayTimer.value = null } - window.electron.ipcRenderer.removeAllListeners(NOTIFICATION_EVENTS.SHOW_ERROR) - window.electron.ipcRenderer.removeAllListeners(NOTIFICATION_EVENTS.DATABASE_REPAIR_SUGGESTED) - window.electron.ipcRenderer.removeListener(SETTINGS_EVENTS.NAVIGATE, handleSettingsNavigate) - window.electron.ipcRenderer.removeListener( - SETTINGS_EVENTS.PROVIDER_INSTALL, - handleProviderInstall - ) + cleanupSettingsNavigate() + cleanupSettingsProviderInstall() + settingsEventCleanups.splice(0).forEach((cleanup) => cleanup()) window.removeEventListener('focus', handleWindowFocus) cleanupMcpDeeplink() }) diff --git a/src/renderer/settings/components/AboutUsSettings.vue b/src/renderer/settings/components/AboutUsSettings.vue index d0dd386c2..2e3362a4b 100644 --- a/src/renderer/settings/components/AboutUsSettings.vue +++ b/src/renderer/settings/components/AboutUsSettings.vue @@ -225,7 +225,10 @@ diff --git a/src/renderer/settings/components/AcpDebugDialog.vue b/src/renderer/settings/components/AcpDebugDialog.vue index a607ecac8..d7f48e115 100644 --- a/src/renderer/settings/components/AcpDebugDialog.vue +++ b/src/renderer/settings/components/AcpDebugDialog.vue @@ -191,8 +191,10 @@ import { Input } from '@shadcn/components/ui/input' import { Badge } from '@shadcn/components/ui/badge' import { Icon } from '@iconify/vue' import type { AcpDebugEventEntry, AcpDebugRequest } from '@shared/presenter' -import { getLegacyWebContentsId, useLegacyPresenter } from '@api/legacy/presenters' -import { ACP_DEBUG_EVENTS } from '@/events' +import { getRuntimeWebContentsId } from '@api/runtime' +import { createConfigClient } from '@api/ConfigClient' +import { createDeviceClient } from '@api/DeviceClient' +import { createProviderClient } from '@api/ProviderClient' import { useToast } from 
'@/components/use-toast' import { nanoid } from 'nanoid' import { useMonaco } from 'stream-monaco' @@ -210,9 +212,9 @@ const emit = defineEmits<{ const { t } = useI18n() const { toast } = useToast() -const llmProviderPresenter = useLegacyPresenter('llmproviderPresenter') -const configPresenter = useLegacyPresenter('configPresenter') -const devicePresenter = useLegacyPresenter('devicePresenter') +const configClient = createConfigClient() +const deviceClient = createDeviceClient() +const providerClient = createProviderClient() const uiSettingsStore = useUiSettingsStore() const selectedMethod = ref('newSession') @@ -222,11 +224,12 @@ const customMethod = ref('') const loading = ref(false) const events = ref([]) const seenIds = new Set() -const webContentsId = getLegacyWebContentsId() +const webContentsId = getRuntimeWebContentsId() const debugSessionId = ref(createDebugSessionId()) const processReady = ref(false) const payloadEditor = ref(null) let editorCreated = false +let stopDebugEvents: (() => void) | null = null const workdirLabel = computed(() => workdirPath.value ? workdirPath.value : t('settings.acp.debug.workdirPlaceholder') ) @@ -495,7 +498,7 @@ const formatTime = (timestamp: number) => { return `${date.toLocaleTimeString()}` } -const handleDebugEvent = (_event: unknown, payload: unknown) => { +const handleDebugEvent = (payload: unknown) => { const parsed = payload as { webContentsId?: number agentId?: string @@ -557,14 +560,13 @@ const handleSend = async () => { loading.value = true try { - const result = await llmProviderPresenter.runAcpDebugAction({ + const result = await providerClient.runAcpDebugAction({ agentId: props.agentId, action: selectedMethod.value, payload: payloadToSend, sessionId, workdir: workdirPath.value || undefined, - methodName: requiresCustomMethod.value ? customMethod.value.trim() : undefined, - webContentsId: webContentsId || undefined + methodName: requiresCustomMethod.value ? 
customMethod.value.trim() : undefined }) if (result?.events?.length) { @@ -598,14 +600,13 @@ const runHealthCheck = async () => { debugSessionId.value = '' loading.value = true try { - await configPresenter.ensureAcpAgentInstalled(props.agentId) + await configClient.ensureAcpAgentInstalled(props.agentId) - const initializeResult = await llmProviderPresenter.runAcpDebugAction({ + const initializeResult = await providerClient.runAcpDebugAction({ agentId: props.agentId, action: 'initialize', payload: templateForMethod('initialize'), - workdir: workdirPath.value || undefined, - webContentsId: webContentsId || undefined + workdir: workdirPath.value || undefined }) appendEvents(initializeResult.events ?? []) @@ -615,12 +616,11 @@ const runHealthCheck = async () => { processReady.value = true - const newSessionResult = await llmProviderPresenter.runAcpDebugAction({ + const newSessionResult = await providerClient.runAcpDebugAction({ agentId: props.agentId, action: 'newSession', payload: applyWorkdirToPayload(templateForMethod('newSession')), - workdir: workdirPath.value || undefined, - webContentsId: webContentsId || undefined + workdir: workdirPath.value || undefined }) appendEvents(newSessionResult.events ?? []) @@ -630,13 +630,12 @@ const runHealthCheck = async () => { const newSessionId = newSessionResult.sessionId - const cancelResult = await llmProviderPresenter.runAcpDebugAction({ + const cancelResult = await providerClient.runAcpDebugAction({ agentId: props.agentId, action: 'cancel', payload: templateForMethod('cancel'), sessionId: newSessionId, - workdir: workdirPath.value || undefined, - webContentsId: webContentsId || undefined + workdir: workdirPath.value || undefined }) appendEvents(cancelResult.events ?? 
[]) @@ -659,7 +658,7 @@ const runHealthCheck = async () => { } const handleSelectWorkdir = async () => { - const result = await devicePresenter.selectDirectory() + const result = await deviceClient.selectDirectory() if (result?.canceled || !result.filePaths?.length) return workdirPath.value = result.filePaths[0] syncWorkdirIntoPayload() @@ -715,15 +714,12 @@ onMounted(async () => { await ensureEditor() resetPayload() } - if (window.electron) { - window.electron.ipcRenderer.on(ACP_DEBUG_EVENTS.EVENT, handleDebugEvent) - } + stopDebugEvents = providerClient.onAcpDebugEvent(handleDebugEvent) }) onBeforeUnmount(() => { disposeEditor() - if (window.electron) { - window.electron.ipcRenderer.removeListener(ACP_DEBUG_EVENTS.EVENT, handleDebugEvent) - } + stopDebugEvents?.() + stopDebugEvents = null }) diff --git a/src/renderer/settings/components/AcpDependencyDialog.vue b/src/renderer/settings/components/AcpDependencyDialog.vue index 486cf52c6..215473ffc 100644 --- a/src/renderer/settings/components/AcpDependencyDialog.vue +++ b/src/renderer/settings/components/AcpDependencyDialog.vue @@ -100,6 +100,7 @@ import { import { Button } from '@shadcn/components/ui/button' import { Label } from '@shadcn/components/ui/label' import { Icon } from '@iconify/vue' +import { createDeviceClient } from '@api/DeviceClient' interface ExternalDependency { name: string @@ -127,6 +128,7 @@ const emit = defineEmits<{ const { t } = useI18n() const { toast } = useToast() +const deviceClient = createDeviceClient() const hasInstallCommands = (commands: ExternalDependency['installCommands']): boolean => { if (!commands) return false @@ -135,20 +137,22 @@ const hasInstallCommands = (commands: ExternalDependency['installCommands']): bo const copyToClipboard = async (text: string) => { try { - if (window.api?.copyText) { - window.api.copyText(text) + try { + deviceClient.copyText(text) toast({ title: t('settings.acp.dependency.copied'), duration: 2000 }) - } else if (navigator.clipboard) { + } catch { 
+ if (!navigator.clipboard) { + console.warn('[AcpDependencyDialog] Clipboard API not available') + return + } await navigator.clipboard.writeText(text) toast({ title: t('settings.acp.dependency.copied'), duration: 2000 }) - } else { - console.warn('[AcpDependencyDialog] Clipboard API not available') } } catch (error) { console.error('[AcpDependencyDialog] Failed to copy to clipboard:', error) diff --git a/src/renderer/settings/components/AcpSettings.vue b/src/renderer/settings/components/AcpSettings.vue index 20db9241d..170bae3d1 100644 --- a/src/renderer/settings/components/AcpSettings.vue +++ b/src/renderer/settings/components/AcpSettings.vue @@ -564,9 +564,8 @@ import type { AcpManualAgent, AcpRegistryAgent } from '@shared/presenter' import type { AgentTransferImpact } from '@shared/types/agent-interface' import { useI18n } from 'vue-i18n' import { useToast } from '@/components/use-toast' -import { useLegacyPresenter } from '@api/legacy/presenters' +import { createConfigClient } from '@api/ConfigClient' import { createSessionClient } from '@api/SessionClient' -import { CONFIG_EVENTS } from '@/events' import { Icon } from '@iconify/vue' import { Card, @@ -598,7 +597,7 @@ import AcpAgentIcon from '@/components/icons/AcpAgentIcon.vue' const { t } = useI18n() const { toast } = useToast() -const configPresenter = useLegacyPresenter('configPresenter') +const configClient = createConfigClient() type RegistryDialogFilter = 'all' | 'installed' | 'not_installed' type PendingDeleteAgent = { @@ -786,13 +785,13 @@ const syncEnvDrafts = (agents: AcpRegistryAgent[]) => { } const loadSharedMcpCount = async () => { - sharedMcpCount.value = (await configPresenter.getAcpSharedMcpSelections()).length + sharedMcpCount.value = (await configClient.getAcpSharedMcpSelections()).length } const loadAcpData = async () => { loading.value = true try { - acpEnabled.value = await configPresenter.getAcpEnabled() + acpEnabled.value = await configClient.getAcpEnabled() if (!acpEnabled.value) { 
registryAgents.value = [] manualAgents.value = [] @@ -801,8 +800,8 @@ const loadAcpData = async () => { } const [registryList, manualList] = await Promise.all([ - configPresenter.listAcpRegistryAgents(), - configPresenter.listManualAcpAgents() + configClient.listAcpRegistryAgents(), + configClient.listManualAcpAgents() ]) registryAgents.value = registryList @@ -820,7 +819,7 @@ const handleToggle = async (enabled: boolean) => { if (toggling.value) return toggling.value = true try { - await configPresenter.setAcpEnabled(enabled) + await configClient.setAcpEnabled(enabled) acpEnabled.value = enabled if (enabled) { await loadAcpData() @@ -835,7 +834,7 @@ const handleToggle = async (enabled: boolean) => { const refreshRegistry = async () => { refreshing.value = true try { - registryAgents.value = await configPresenter.refreshAcpRegistry(true) + registryAgents.value = await configClient.refreshAcpRegistry(true) syncEnvDrafts(registryAgents.value) } catch (error) { handleError(error) @@ -851,7 +850,7 @@ const handleSharedMcpUpdated = (selections: string[]) => { const toggleRegistryAgent = async (agent: AcpRegistryAgent, enabled: boolean) => { setAgentPending(agent.id, true) try { - await configPresenter.setAcpAgentEnabled(agent.id, enabled) + await configClient.setAcpAgentEnabled(agent.id, enabled) await loadAcpData() } catch (error) { handleError(error) @@ -863,7 +862,7 @@ const toggleRegistryAgent = async (agent: AcpRegistryAgent, enabled: boolean) => const saveEnvOverride = async (agent: AcpRegistryAgent) => { setAgentPending(agent.id, true) try { - await configPresenter.setAcpAgentEnvOverride(agent.id, parseEnvBlock(envDrafts[agent.id] ?? '')) + await configClient.setAcpAgentEnvOverride(agent.id, parseEnvBlock(envDrafts[agent.id] ?? 
'')) await loadAcpData() toast({ title: t('settings.acp.saveSuccess') }) } catch (error) { @@ -882,9 +881,9 @@ const installRegistryAgent = async (agent: AcpRegistryAgent) => { setAgentPending(agent.id, true) try { if (agent.installState?.status === 'error') { - await configPresenter.repairAcpAgent(agent.id) + await configClient.repairAcpAgent(agent.id) } else { - await configPresenter.ensureAcpAgentInstalled(agent.id) + await configClient.ensureAcpAgentInstalled(agent.id) } await loadAcpData() } catch (error) { @@ -897,7 +896,7 @@ const installRegistryAgent = async (agent: AcpRegistryAgent) => { const repairRegistryAgent = async (agent: AcpRegistryAgent) => { setAgentPending(agent.id, true) try { - await configPresenter.repairAcpAgent(agent.id) + await configClient.repairAcpAgent(agent.id) await loadAcpData() } catch (error) { handleError(error) @@ -943,9 +942,9 @@ const saveManualAgent = async () => { } if (manualDialog.agentId) { - await configPresenter.updateManualAcpAgent(manualDialog.agentId, payload) + await configClient.updateManualAcpAgent(manualDialog.agentId, payload) } else { - await configPresenter.addManualAcpAgent(payload) + await configClient.addManualAcpAgent(payload) } manualDialog.open = false @@ -961,7 +960,7 @@ const saveManualAgent = async () => { const toggleManualAgent = async (agent: AcpManualAgent, enabled: boolean) => { setAgentPending(agent.id, true) try { - await configPresenter.updateManualAcpAgent(agent.id, { enabled }) + await configClient.updateManualAcpAgent(agent.id, { enabled }) await loadAcpData() } catch (error) { handleError(error) @@ -980,7 +979,7 @@ const openAgentTransferDialog = async (agent: PendingDeleteAgent) => { const sessionClient = createSessionClient() const [impact, agents] = await Promise.all([ sessionClient.getAgentTransferImpact(agent.id), - configPresenter.listAgents() + configClient.listAgents() ]) transferImpact.value = impact transferAgents.value = agents @@ -1016,10 +1015,10 @@ const 
confirmRegistryAgentUninstall = async (agent: AcpRegistryAgent) => { const finishDeleteAgent = async (agent: PendingDeleteAgent) => { if (agent.source === 'registry') { - await configPresenter.uninstallAcpRegistryAgent(agent.id) + await configClient.uninstallAcpRegistryAgent(agent.id) toast({ title: t('settings.acp.deleteSuccess') }) } else { - const removed = await configPresenter.removeManualAcpAgent(agent.id) + const removed = await configClient.removeManualAcpAgent(agent.id) if (!removed) { throw new Error(t('dialog.agentTransfer.agentDeleteBlocked')) } @@ -1112,6 +1111,7 @@ const handleRegistryCatalogAction = async (agent: AcpRegistryAgent) => { } let refreshTimer: ReturnType | null = null +let cleanupAgentsChanged: (() => void) | null = null const scheduleAcpDataReload = () => { if (refreshTimer) { @@ -1125,7 +1125,7 @@ const scheduleAcpDataReload = () => { onMounted(() => { void loadAcpData() - window.electron?.ipcRenderer?.on(CONFIG_EVENTS.AGENTS_CHANGED, scheduleAcpDataReload) + cleanupAgentsChanged = configClient.onAgentsChanged(scheduleAcpDataReload) }) onBeforeUnmount(() => { @@ -1133,6 +1133,7 @@ onBeforeUnmount(() => { clearTimeout(refreshTimer) refreshTimer = null } - window.electron?.ipcRenderer?.removeListener(CONFIG_EVENTS.AGENTS_CHANGED, scheduleAcpDataReload) + cleanupAgentsChanged?.() + cleanupAgentsChanged = null }) diff --git a/src/renderer/settings/components/AcpTerminalDialog.vue b/src/renderer/settings/components/AcpTerminalDialog.vue index f2f3e05ea..eecdd92af 100644 --- a/src/renderer/settings/components/AcpTerminalDialog.vue +++ b/src/renderer/settings/components/AcpTerminalDialog.vue @@ -45,6 +45,8 @@ import { Dialog, DialogContent, DialogHeader, DialogTitle } from '@shadcn/compon import { Button } from '@shadcn/components/ui/button' import { Icon } from '@iconify/vue' import { useToast } from '@/components/use-toast' +import { createAcpTerminalClient } from '@api/AcpTerminalClient' +import { createDeviceClient } from 
'@api/DeviceClient' const props = defineProps<{ open: boolean @@ -58,9 +60,12 @@ const emit = defineEmits<{ const { t } = useI18n() const { toast } = useToast() +const acpTerminalClient = createAcpTerminalClient() +const deviceClient = createDeviceClient() const terminalContainer = ref(null) let terminal: Terminal | null = null +let terminalEventCleanups: Array<() => void> = [] const isRunning = ref(false) const status = ref<'idle' | 'running' | 'completed' | 'error'>('idle') @@ -114,9 +119,9 @@ const handleOpenUpdate = (val: boolean) => { if (!val) { // Kill process if running if (isRunning.value) { - if (window.electron) { - window.electron.ipcRenderer.send('acp-terminal:kill') - } + void acpTerminalClient.kill().catch((error) => { + console.warn('[AcpTerminal] Failed to kill terminal:', error) + }) } emit('update:open', false) emit('close') @@ -156,9 +161,9 @@ const ensureTerminal = () => { // Send input to backend process // Don't echo locally - let the backend process handle all output // This avoids xterm.js parsing errors with control characters - if (window.electron) { - window.electron.ipcRenderer.send('acp-terminal:input', data) - } + void acpTerminalClient.sendInput(data).catch((error) => { + console.warn('[AcpTerminal] Failed to send terminal input:', error) + }) }) } } @@ -172,7 +177,7 @@ const cleanupTerminal = () => { console.log('[AcpTerminal] Terminal cleaned up') } -const handleOutput = (_event: unknown, data: string | { type: string; data: string }) => { +const handleOutput = (data: string | { type: string; data: string }) => { if (!terminal) { console.warn('[AcpTerminal] Received output but terminal is not initialized') return @@ -229,7 +234,7 @@ const handleOutput = (_event: unknown, data: string | { type: string; data: stri } } -const handleStart = (_event: unknown) => { +const handleStart = () => { isRunning.value = true status.value = 'running' if (terminal) { @@ -237,7 +242,7 @@ const handleStart = (_event: unknown) => { } } -const 
handleExit = (_event: unknown, data: { code: number | null; signal: string | null }) => { +const handleExit = (data: { code: number | null; signal: string | null }) => { isRunning.value = false if (data.code === 0) { status.value = 'completed' @@ -251,7 +256,7 @@ const handleExit = (_event: unknown, data: { code: number | null; signal: string } } -const handleError = (_event: unknown, data: { message: string }) => { +const handleError = (data: { message: string }) => { status.value = 'error' if (terminal) { terminal.writeln(`\r\n\x1b[31mError: ${data.message}\x1b[0m`) @@ -260,14 +265,9 @@ const handleError = (_event: unknown, data: { message: string }) => { const handlePaste = async () => { try { - if (!window.api || typeof window.api.readClipboardText !== 'function') { - console.warn('[AcpTerminal] readClipboardText API not available') - return - } - - const text = window.api.readClipboardText() - if (text && window.electron) { - window.electron.ipcRenderer.send('acp-terminal:input', text) + const text = deviceClient.readClipboardText() + if (text) { + await acpTerminalClient.sendInput(text) console.log('[AcpTerminal] Pasted text to terminal:', text.length, 'characters') } } catch (error) { @@ -280,10 +280,10 @@ const handlePaste = async () => { } } -const handleExternalDepsRequired = ( - _event: unknown, - data: { agentId: string; missingDeps: ExternalDependency[] } -) => { +const handleExternalDepsRequired = (data: { + agentId: string + missingDeps: ExternalDependency[] +}) => { console.log('[AcpTerminal] External dependencies required:', data) if (!data.missingDeps || data.missingDeps.length === 0) { @@ -299,30 +299,20 @@ const handleExternalDepsRequired = ( } const setupIpcListeners = () => { - if (typeof window === 'undefined' || !window.electron) { - console.warn('[AcpTerminal] Cannot setup IPC listeners - window.electron not available') - return - } - console.log('[AcpTerminal] Setting up IPC listeners') - window.electron.ipcRenderer.on('acp-init:start', 
handleStart) - window.electron.ipcRenderer.on('acp-init:output', handleOutput) - window.electron.ipcRenderer.on('acp-init:exit', handleExit) - window.electron.ipcRenderer.on('acp-init:error', handleError) - window.electron.ipcRenderer.on('external-deps-required', handleExternalDepsRequired) + removeIpcListeners() + terminalEventCleanups = [ + acpTerminalClient.onStarted(handleStart), + acpTerminalClient.onOutput(handleOutput), + acpTerminalClient.onExited(handleExit), + acpTerminalClient.onError(handleError), + acpTerminalClient.onExternalDependenciesRequired(handleExternalDepsRequired) + ] console.log('[AcpTerminal] IPC listeners set up successfully') } const removeIpcListeners = () => { - if (typeof window === 'undefined' || !window.electron) { - return - } - - window.electron.ipcRenderer.removeAllListeners('acp-init:start') - window.electron.ipcRenderer.removeAllListeners('acp-init:output') - window.electron.ipcRenderer.removeAllListeners('acp-init:exit') - window.electron.ipcRenderer.removeAllListeners('acp-init:error') - window.electron.ipcRenderer.removeAllListeners('external-deps-required') + terminalEventCleanups.splice(0).forEach((cleanup) => cleanup()) } watch( diff --git a/src/renderer/settings/components/BuiltinKnowledgeSettings.vue b/src/renderer/settings/components/BuiltinKnowledgeSettings.vue index 8a4611703..2ea8fa2bb 100644 --- a/src/renderer/settings/components/BuiltinKnowledgeSettings.vue +++ b/src/renderer/settings/components/BuiltinKnowledgeSettings.vue @@ -598,17 +598,18 @@ import { BuiltinKnowledgeConfig, RENDERER_MODEL_META } from '@shared/presenter' import { toast } from '@/components/use-toast' import { useRoute } from 'vue-router' import { nanoid } from 'nanoid' -import { useLegacyPresenter } from '@api/legacy/presenters' import { useModelStore } from '@/stores/modelStore' import { createConfigClient } from '@api/ConfigClient' +import { createKnowledgeClient } from '@api/KnowledgeClient' +import { createProviderClient } from 
'@api/ProviderClient' // 全局对象 const { t } = useI18n() const mcpStore = useMcpStore() const modelStore = useModelStore() const themeStore = useThemeStore() const configClient = createConfigClient() -const llmP = useLegacyPresenter('llmproviderPresenter') -const knowledgeP = useLegacyPresenter('knowledgePresenter') +const knowledgeClient = createKnowledgeClient() +const providerClient = createProviderClient() const emit = defineEmits<{ (e: 'showDetail', config: BuiltinKnowledgeConfig): void }>() @@ -815,7 +816,7 @@ const saveBuiltinConfig = async () => { } // 自动获取dimensions if (autoDetectDimensionsSwitch.value) { - const result = await llmP.getDimensions( + const result = await providerClient.getEmbeddingDimensions( editingBuiltinConfig.value.embedding.providerId, editingBuiltinConfig.value.embedding.modelId ) @@ -943,7 +944,7 @@ const loadBuiltinConfig = async () => { const separators = ref('') const supportedLanguages = ref([]) -knowledgeP.getSupportedLanguages().then((res) => { +knowledgeClient.getSupportedLanguages().then((res) => { supportedLanguages.value = res console.log('支持的语言:', supportedLanguages.value) }) @@ -955,7 +956,7 @@ const handleLanguageSelect = async (language: string) => { } const getSeparatorsForLanguage = async (language: string) => { - return await knowledgeP.getSeparatorsForLanguage(language) + return await knowledgeClient.getSeparatorsForLanguage(language) } /** diff --git a/src/renderer/settings/components/DashboardSettings.vue b/src/renderer/settings/components/DashboardSettings.vue index 79d55b01f..10d7be505 100644 --- a/src/renderer/settings/components/DashboardSettings.vue +++ b/src/renderer/settings/components/DashboardSettings.vue @@ -673,7 +673,7 @@ import { } from '@shadcn/components/ui/chart' import type { ChartConfig } from '@shadcn/components/ui/chart' import type { UsageDashboardCalendarDay, UsageDashboardData } from '@shared/types/agent-interface' -import { useLegacyPresenter } from '@api/legacy/presenters' +import { 
createSessionClient } from '@api/SessionClient' import UsageNostalgiaCard from './control-center/UsageNostalgiaCard.vue' type CalendarCell = UsageDashboardCalendarDay | null @@ -700,7 +700,7 @@ type BreakdownChartRow = { barRatio: number } const { t, locale } = useI18n() -const agentSessionPresenter = useLegacyPresenter('agentSessionPresenter') +const sessionClient = createSessionClient() const props = withDefaults( defineProps<{ hideNostalgia?: boolean @@ -957,7 +957,7 @@ async function loadDashboard(): Promise { try { isLoading.value = true errorMessage.value = '' - const nextDashboard = await agentSessionPresenter.getUsageDashboard() + const nextDashboard = await sessionClient.getUsageDashboard() if (!isDashboardMounted) { return } @@ -986,7 +986,7 @@ async function retryRtkHealthCheck(): Promise { try { isRetryingRtk.value = true - await agentSessionPresenter.retryRtkHealthCheck() + await sessionClient.retryRtkHealthCheck() await loadDashboard() } catch (error) { errorMessage.value = diff --git a/src/renderer/settings/components/DataSettings.vue b/src/renderer/settings/components/DataSettings.vue index 5ef140d50..74e1a97cb 100644 --- a/src/renderer/settings/components/DataSettings.vue +++ b/src/renderer/settings/components/DataSettings.vue @@ -5,7 +5,10 @@ :description="t('settings.data.privacyDescription')" >
-
+
@@ -533,6 +538,7 @@
- +
-
@@ -109,6 +117,7 @@